<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "http://jats.nlm.nih.gov/publishing/1.3/JATS-journalpublishing1-3.dtd">
<article article-type="review-article" dtd-version="1.3" xml:lang="en" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="nlm-ta">PJS</journal-id>
<journal-id journal-id-type="publisher-id">Premier Journal of Science</journal-id>
<journal-id journal-id-type="pmc">PJS</journal-id>
<journal-title-group>
<journal-title>PJ SCIENCE</journal-title>
</journal-title-group>
<issn pub-type="epub">3049-9011</issn>
<publisher>
<publisher-name>Premier Science</publisher-name>
<publisher-loc>London, UK</publisher-loc>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.70389/PJS.100043</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>REVIEW</subject>
</subj-group>
<subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Neuroscience</subject><subj-group><subject>Cognitive science</subject><subj-group><subject>Cognitive psychology</subject><subj-group><subject>Perception</subject><subj-group><subject>Sensory perception</subject><subj-group><subject>Hallucinations</subject></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group>
<subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Psychology</subject><subj-group><subject>Cognitive psychology</subject><subj-group><subject>Perception</subject><subj-group><subject>Sensory perception</subject><subj-group><subject>Hallucinations</subject></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group>
<subj-group subj-group-type="Discipline-v3"><subject>Social sciences</subject><subj-group><subject>Psychology</subject><subj-group><subject>Cognitive psychology</subject><subj-group><subject>Perception</subject><subj-group><subject>Sensory perception</subject><subj-group><subject>Hallucinations</subject></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group>
<subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Neuroscience</subject><subj-group><subject>Sensory perception</subject><subj-group><subject>Hallucinations</subject></subj-group></subj-group></subj-group></subj-group>
<subj-group subj-group-type="Discipline-v3"><subject>Social sciences</subject><subj-group><subject>Linguistics</subject><subj-group><subject>Grammar</subject><subj-group><subject>Phonology</subject><subj-group><subject>Syllables</subject></subj-group></subj-group></subj-group></subj-group></subj-group>
<subj-group subj-group-type="Discipline-v3"><subject>Engineering and technology</subject><subj-group><subject>Signal processing</subject><subj-group><subject>Speech signal processing</subject></subj-group></subj-group></subj-group>
<subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Neuroscience</subject><subj-group><subject>Cognitive science</subject><subj-group><subject>Cognitive psychology</subject><subj-group><subject>Perception</subject><subj-group><subject>Sensory perception</subject></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group>
<subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Psychology</subject><subj-group><subject>Cognitive psychology</subject><subj-group><subject>Perception</subject><subj-group><subject>Sensory perception</subject></subj-group></subj-group></subj-group></subj-group></subj-group>
<subj-group subj-group-type="Discipline-v3"><subject>Social sciences</subject><subj-group><subject>Psychology</subject><subj-group><subject>Cognitive psychology</subject><subj-group><subject>Perception</subject><subj-group><subject>Sensory perception</subject></subj-group></subj-group></subj-group></subj-group></subj-group>
<subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Neuroscience</subject><subj-group><subject>Sensory perception</subject></subj-group></subj-group></subj-group>
<subj-group subj-group-type="Discipline-v3"><subject>Medicine and health sciences</subject><subj-group><subject>Mental health and psychiatry</subject><subj-group><subject>Schizophrenia</subject></subj-group></subj-group></subj-group>
<subj-group subj-group-type="Discipline-v3"><subject>Research and analysis methods</subject><subj-group><subject>Bioassays and physiological analysis</subject><subj-group><subject>Electrophysiological techniques</subject><subj-group><subject>Brain electrophysiology</subject><subj-group><subject>Electroencephalography</subject><subj-group><subject>Event-related potentials</subject></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group>
<subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Physiology</subject><subj-group><subject>Electrophysiology</subject><subj-group><subject>Neurophysiology</subject><subj-group><subject>Brain electrophysiology</subject><subj-group><subject>Electroencephalography</subject><subj-group><subject>Event-related potentials</subject></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group>
<subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Neuroscience</subject><subj-group><subject>Neurophysiology</subject><subj-group><subject>Brain electrophysiology</subject><subj-group><subject>Electroencephalography</subject><subj-group><subject>Event-related potentials</subject></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group>
<subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Neuroscience</subject><subj-group><subject>Brain mapping</subject><subj-group><subject>Electroencephalography</subject><subj-group><subject>Event-related potentials</subject></subj-group></subj-group></subj-group></subj-group></subj-group>
<subj-group subj-group-type="Discipline-v3"><subject>Medicine and health sciences</subject><subj-group><subject>Clinical medicine</subject><subj-group><subject>Clinical neurophysiology</subject><subj-group><subject>Electroencephalography</subject><subj-group><subject>Event-related potentials</subject></subj-group></subj-group></subj-group></subj-group></subj-group>
<subj-group subj-group-type="Discipline-v3"><subject>Research and analysis methods</subject><subj-group><subject>Imaging techniques</subject><subj-group><subject>Neuroimaging</subject><subj-group><subject>Electroencephalography</subject><subj-group><subject>Event-related potentials</subject></subj-group></subj-group></subj-group></subj-group></subj-group>
<subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Neuroscience</subject><subj-group><subject>Neuroimaging</subject><subj-group><subject>Electroencephalography</subject><subj-group><subject>Event-related potentials</subject></subj-group></subj-group></subj-group></subj-group></subj-group>
<subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Cell biology</subject><subj-group><subject>Cellular types</subject><subj-group><subject>Animal cells</subject><subj-group><subject>Neurons</subject><subj-group><subject>Interneurons</subject></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group>
<subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Neuroscience</subject><subj-group><subject>Cellular neuroscience</subject><subj-group><subject>Neurons</subject><subj-group><subject>Interneurons</subject></subj-group></subj-group></subj-group></subj-group></subj-group>
<subj-group subj-group-type="Discipline-v3"><subject>Research and analysis methods</subject><subj-group><subject>Bioassays and physiological analysis</subject><subj-group><subject>Electrophysiological techniques</subject><subj-group><subject>Brain electrophysiology</subject><subj-group><subject>Electroencephalography</subject></subj-group></subj-group></subj-group></subj-group></subj-group>
<subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Physiology</subject><subj-group><subject>Electrophysiology</subject><subj-group><subject>Neurophysiology</subject><subj-group><subject>Brain electrophysiology</subject><subj-group><subject>Electroencephalography</subject></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group>
<subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Neuroscience</subject><subj-group><subject>Neurophysiology</subject><subj-group><subject>Brain electrophysiology</subject><subj-group><subject>Electroencephalography</subject></subj-group></subj-group></subj-group></subj-group></subj-group>
<subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Neuroscience</subject><subj-group><subject>Brain mapping</subject><subj-group><subject>Electroencephalography</subject></subj-group></subj-group></subj-group></subj-group>
<subj-group subj-group-type="Discipline-v3"><subject>Medicine and health sciences</subject><subj-group><subject>Clinical medicine</subject><subj-group><subject>Clinical neurophysiology</subject><subj-group><subject>Electroencephalography</subject></subj-group></subj-group></subj-group></subj-group>
<subj-group subj-group-type="Discipline-v3"><subject>Research and analysis methods</subject><subj-group><subject>Imaging techniques</subject><subj-group><subject>Neuroimaging</subject><subj-group><subject>Electroencephalography</subject></subj-group></subj-group></subj-group></subj-group>
<subj-group subj-group-type="Discipline-v3"><subject>Biology and life sciences</subject><subj-group><subject>Neuroscience</subject><subj-group><subject>Neuroimaging</subject><subj-group><subject>Electroencephalography</subject></subj-group></subj-group></subj-group></subj-group>
</article-categories>
<title-group>
<article-title>Machine Learning for Early Disease Diagnosis: A Review of Techniques in Healthcare Applications</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Faraz Manzoor</surname>
<given-names>Muhammad</given-names>
</name>
<role content-type="http://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role content-type="http://credit.niso.org/contributor-roles/writing-original-draft/">Writing &#x2013; original draft</role>
<role content-type="http://credit.niso.org/contributor-roles/writing-review-editing/">Review and editing</role>
</contrib>
<aff id="aff001">Department of Artificial Intelligence, School of System and Technology, <institution>UMT</institution>, <city>Lahore</city>, <country>Pakistan</country></aff>
</contrib-group>
<author-notes>
<corresp id="cor001"><bold>Correspondence to:</bold> Muhammad Faraz Manzoor, <email>Faraz.Manzoor@umt.edu.pk</email></corresp>
</author-notes>
<pub-date pub-type="epub">
<day>17</day>
<month>12</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<month>12</month>
<year>2024</year>
</pub-date>
<volume>6</volume>
<issue>1</issue>
<elocation-id>100043</elocation-id>
<history>
<date date-type="received">
<day>21</day>
<month>11</month>
<year>2024</year>
</date>
<date date-type="rev-recd">
<day>04</day>
<month>12</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>05</day>
<month>12</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-year>2025</copyright-year>
<copyright-holder>Muhammad Faraz Manzoor</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/" xlink:type="simple">
<license-p>This is an open access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/licenses/by/4.0/" xlink:type="simple">Creative Commons Attribution License</ext-link>, which permits unrestricted use, distribution, and reproduction in any medium, provided the original author and source are credited.</license-p>
</license>
</permissions>
<self-uri content-type="pdf" xlink:href="info:doi/10.70389/PJS.2025.100043"/>
<abstract>
<p>Early disease detection has long been a cornerstone of healthcare, with the adage &#x201C;prevention is better than cure.&#x201D; The rise of machine learning (ML) has revolutionized this field, enabling the analysis of vast medical data to predict health issues before they become clinically evident. Traditional detection methods, relying on manual examinations and patient history, are often limited by human error and subjectivity, especially as medical datasets grow in size and complexity. This review addresses the gap between conventional diagnostic methods and ML&#x2019;s potential in early disease detection. It explores various ML algorithms used across domains such as heart disease, diabetes, and cancer, and tracks the evolution of ML techniques from 2015 to 2024. The review also examines ethical and technical challenges, particularly concerning data privacy. Emerging trends in the field, such as the integration of ensemble learning and deep learning models, are also proposed. The significance of this work lies in its comprehensive overview of ML in early disease detection, highlighting its transformative potential in improving diagnosis accuracy, reducing healthcare costs, and enhancing patient outcomes.</p>
</abstract>
<kwd-group kwd-group-type="author">
<kwd>Machine learning</kwd>
<kwd>Early disease detection</kwd>
<kwd>Healthcare applications</kwd>
<kwd>Deep learning</kwd>
<kwd>Data privacy</kwd>
</kwd-group>
<counts>
<fig-count count="4"/>
<table-count count="7"/>
<page-count count="15"/>
</counts>
</article-meta>
</front>
<body>
<sec>
<title>
<ext-link ext-link-type="uri" xlink:href="https://premierscience.com/wp-content/uploads/2025/05/pjs-24-579.pdf">Source-File: pjs-24-579.pdf</ext-link>
</title>
</sec>
<sec id="sec001" sec-type="intro">
<title>Introduction</title>
<p>Throughout history, healthcare has been guided by the aphorism &#x201C;prevention is better than cure.&#x201D; Early detection is not only better for the patient but also greatly reduces the strain on the healthcare system. Machine learning (ML) has ushered in a new era of predictive potential and has revolutionized how early disease detection takes place, whereas the mainstays of early disease diagnosis have in the past been manual examination, patient history, and simple diagnostic tools. Physicians have long been taught to identify trends and departures from the norm and to base their choices on their clinical expertise. However, because they rely on human judgment, which is subjective and prone to error, these approaches are frequently constrained.<sup><xref ref-type="bibr" rid="ref1">1</xref></sup> Additionally, the vast and disjointed datasets produced by modern medicine may be too big for conventional approaches to handle. ML is a rapidly evolving subset of artificial intelligence (AI), and its ability to create algorithms that can examine data, find patterns in them, and predict future events is intriguing. ML techniques are a rapidly growing trend for early detection of diseases because they can process and analyze massive amounts of data, or &#x201C;big data&#x201D;. Because of this change in strategy, we have been able to build prediction models that can learn and perceive patterns and connections that are potentially too subtle for humans to pick up.<sup><xref ref-type="bibr" rid="ref2">2</xref></sup></p>
<p>At the same time, one of the main advantages of ML in early disease diagnosis is that it can treat a huge number of factors simultaneously. For instance, ML algorithms can take many more inputs such as genetics, family history, and other personal behaviors and environmental situations, whereas traditional approaches might only look at a few different symptoms. An advantage of this method is that it allows for the measurement of illness risk more precisely and individually for each patient. ML approaches have been found to add value in a range of medical specialties. For example, in radiology, sophisticated imaging methods including computed tomography (CT) scans and magnetic resonance imaging (MRI) produce tens of millions of pixels of data that will surpass the capacity of the human radiologist to view in their entirety.<sup><xref ref-type="bibr" rid="ref3">3</xref></sup> ML algorithms can quickly filter through these photos, and automatically identify very small irregularities which the human eye may not detect. In much the same way, we are also using ML algorithms to improve our ability to analyze DNA sequences to find hereditary susceptibilities to disease. One approach to healthcare is iterative ML. The more data they can process, the better their algorithms tend to perform. Early disease identification is one place where this adaptability is especially helpful given that symptoms are often very complex and highly dynamic. ML algorithms have the tendency to increase the accuracy with which they can detect early illness markers when continuing learning and improvement in prediction.<sup><xref ref-type="bibr" rid="ref4">4</xref></sup></p>
<p>However, incorporating ML into early disease diagnosis is not without its challenges. Because medical data is sensitive, worries about data security and privacy continue to be the most pressing issues. Making sure ML models are visible and explicable is a second challenge; certain algorithms are &#x201C;black boxes&#x201D; which could prevent their clinical use. Furthermore, because historical data is not entirely equitable, it can skew healthcare outcomes for the patients who get it. Compared to traditional methods, ML for early disease diagnosis represents a paradigm change in healthcare. The fundamentals are covered by traditional approaches, but ML capabilities enable previously unattainable scales for processing large amounts of data and deriving useful insights. In order to effectively leverage the predictive power for early disease diagnosis and promote healthy populations and healthcare systems, medical specialists and data scientists will need to collaborate as technology continues to advance.<sup><xref ref-type="bibr" rid="ref5">5</xref></sup></p>
<p>The aim of this study is to explore the role of ML, ensemble learning (EL), and deep learning (DL) models in early disease detection, analyzing their evolution, common applications, and performance across various diseases. The study also examines the ethical and technical challenges associated with these technologies, particularly concerning data privacy, while proposing emerging trends for future advancements in the field. The contributions of the study are stated below:
<list list-type="roman-lower">
<list-item><p>Identification of common ML, EL, and DL models used in early disease prediction.</p></list-item>
<list-item><p>Analysis of the evolution of these models, along with an exploration of challenges and emerging trends in the field.</p></list-item>
</list></p>
<p>The rest of the article is organized as follows: Section 2 presents the architecture of the early disease prediction system, detailing the components and workflow. Section 3 explores various ML techniques applied to different disease diagnoses, highlighting their effectiveness. Section 4 provides a discussion of the findings and implications of the proposed methods. In Section 5, the challenges and opportunities in early disease detection are addressed, focusing on current limitations and potential advancements. Section 6 offers a glimpse into the future, discussing emerging trends and prospects in ML-driven early disease diagnostics. Finally, Section 7 concludes the article with a summary of key insights and future directions.</p>
</sec>
<sec id="sec002">
<title>Architecture of the Early Disease Prediction</title>
<p>The process starts with collecting medical datasets derived from various sources, including patient data and electronic health records. These raw datasets undergo preprocessing to clean, normalize, and organize the information, ensuring consistency and accuracy. Following this, feature extraction and selection are performed to identify and prioritize the most relevant features or variables for disease prediction, reducing dimensionality and improving computational efficiency.</p>
<p>Once the data is prepared, advanced computational methods are applied, including DL, ML, and optimization-based techniques. These methods analyze the data to identify patterns and relationships indicative of disease risks. The performance of these models is then evaluated using metrics like accuracy, precision, F-measure, and processing time. Based on this evaluation, the best-performing model is selected and used for disease prediction. The ultimate goal of this architecture is to facilitate accurate and efficient early detection of diseases, enabling timely medical intervention. The general architecture of early disease prediction is shown in <xref ref-type="fig" rid="F1">Figure 1</xref>.</p>
<fig id="F1" position="float">
<object-id pub-id-type="doi">10.70389/journal.pjs.100043.g001</object-id>
<label>Fig 1</label>
<caption><title>General architecture of early disease prediction</title></caption>
<p><ext-link ext-link-type="uri" xlink:href="https://i0.wp.com/premierscience.com/wp-content/uploads/2025/05/pjs-24-579-Figure-1.jpg">Figure 1</ext-link></p>
</fig>
</sec>
<sec id="sec003">
<title>Machine Learning Techniques for Different Disease Diagnoses</title>
<p>Several authors and scholars have employed ML methods to diagnose illnesses. This section explains the significance and influence of different forms of ML-based disease diagnostics (MLBDD) that have been debated extensively. For example, as COVID-19 is a worldwide problem, a lot of research publications from 2020 to the present have concentrated on utilizing ML to diagnose COVID-19 disease, which is what we also gave priority to in this study. Heart disease, kidney disease, breast cancer, diabetes, Parkinson&#x2019;s, Alzheimer&#x2019;s, and COVID-19 are among the serious diseases; additional illnesses are briefly covered under the &#x201C;Other Diseases&#x201D; heading.</p>
</sec>
<sec id="sec004">
<title>Heart Disease</title>
<p>ML algorithms are used by most researchers and experts to detect heart problems.<sup><xref ref-type="bibr" rid="ref6">6</xref>, <xref ref-type="bibr" rid="ref7">7</xref></sup> For example, Ansari et al.<sup><xref ref-type="bibr" rid="ref6">6</xref></sup> introduced an automated method for diagnosing coronary heart disease based on neuro-fuzzy integrated systems, which achieved an accuracy of about 89&#x0025;. The absence of a thorough description of how the suggested approach might be applied in numerous situations, such as multiclass classification, large-scale data processing, and imbalanced class distributions, is one of the study&#x2019;s main flaws. Additionally, the model&#x2019;s prediction validity is uncertain, which has recently raised serious concerns in the medical community, particularly for patients who are unfamiliar with medical terminology. In order to identify irregular heartbeats, Rubin et al.<sup><xref ref-type="bibr" rid="ref8">8</xref></sup> used a deep convolutional neural network (CNN). The researchers of the study subsequently modified the loss function as a strategy to increase the training set&#x2019;s sensitivity and improve the specificity. They submitted their model to the PhysioNet classification computer competition in 2016. With a final result of 0.95 specificity and 0.73 sensitivity, they placed second in the competition.</p>
<p>In addition, DL-based algorithms have recently been employed to identify heart disease. For example, Miao and Miao<sup><xref ref-type="bibr" rid="ref9">9</xref></sup> presented a DL method for determining electronic fetal monitoring (EFM) based on the multiclass morphologic pattern. The model identifies the morphologic pattern of patients with pregnancy problems. Additional preliminary computational findings include an F1 score of 0.85, an accuracy of 88.02&#x0025;, and a precision of 85.01&#x0025;. They acknowledged that a greater accuracy rate was a benefit of using a variety of dropout techniques to address the overfitting problems in that study, which also improved training time.</p>
<p>Khader Basha et al.<sup><xref ref-type="bibr" rid="ref10">10</xref></sup> utilized a hybrid ML approach combining decision tree (DT) and AdaBoost to enhance coronary heart disease prediction, focusing on cardiac and kidney disorders. Their model&#x2019;s performance was measured by accuracy, true positive rate (TPR), and specificity. Meanwhile, Chandrasekhar and Peddakrishna<sup><xref ref-type="bibr" rid="ref11">11</xref></sup> tested six algorithms (random forest, K-nearest neighbor, logistic regression (LR), Na&#x00EF;ve Bayes, gradient boosting, and AdaBoost) on Cleveland and IEEE DataPort datasets. Using GridSearchCV and fivefold cross-validation, LR achieved 90.16&#x0025; accuracy on Cleveland, while AdaBoost reached 90&#x0025; on IEEE DataPort. Their soft voting ensemble classifier further improved accuracy to 93.44&#x0025; (Cleveland) and 95&#x0025; (IEEE), outperforming individual models and prior studies.</p>
<p>Although there is a wealth of research on using ML to diagnose cardiac disease,<sup><xref ref-type="bibr" rid="ref12">12</xref></sup> none of it has addressed the difficulties associated with multiclass categorization of unbalanced data. In most situations, nevertheless, the model&#x2019;s capacity to explain the ultimate forecast is severely constrained. Some of the cited studies that employed ML and DL to identify heart disease are shown in <xref ref-type="table" rid="T1">Table 1</xref> of this article.</p>
<table-wrap id="T1">
<label>Table 1</label>
<caption>
<title>Comparison of Machine Learning Techniques in Heart Disease Detection</title>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th valign="middle" align="left">Ref</th>
<th valign="middle" align="left">Year</th>
<th valign="middle" align="left">Algorithms Utilized</th>
<th valign="middle" align="left">Dataset Used</th>
<th valign="middle" align="left">Data Format</th>
<th valign="middle" align="left">Performance Metrics</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left"><xref ref-type="bibr" rid="ref13">13</xref></td>
<td valign="middle" align="left">2021</td>
<td valign="middle" align="left">Gaussian Na&#x00EF;ve Bayes, Bernoulli Na&#x00EF;ve Bayes, RF</td>
<td valign="middle" align="left">Cleveland dataset</td>
<td valign="middle" align="left">Tabular</td>
<td valign="middle" align="left">Gaussian Na&#x00EF;ve Bayes achieved an accuracy of 85.00&#x0025;.</td>
</tr>
<tr>
<td valign="middle" align="left"><xref ref-type="bibr" rid="ref14">14</xref></td>
<td valign="middle" align="left">2020</td>
<td valign="middle" align="left">RF, CNN</td>
<td valign="middle" align="left">Cleveland dataset</td>
<td valign="middle" align="left">Tabular</td>
<td valign="middle" align="left">Random forest achieved an accuracy of 80.33&#x0025;.</td>
</tr>
<tr>
<td valign="middle" align="left"><xref ref-type="bibr" rid="ref15">15</xref></td>
<td valign="middle" align="left">2019</td>
<td valign="middle" align="left">Support vector machine (SVM)</td>
<td valign="middle" align="left">Cleveland database</td>
<td valign="middle" align="left">Tabular</td>
<td valign="middle" align="left">Accuracy observed across various methods ranged from 73&#x0025; to 91&#x0025;.</td>
</tr>
<tr>
<td valign="middle" align="left"><xref ref-type="bibr" rid="ref16">16</xref></td>
<td valign="middle" align="left">2019</td>
<td valign="middle" align="left">Back-propagation neural network, logistic regression</td>
<td valign="middle" align="left">Cleveland dataset</td>
<td valign="middle" align="left">Tabular</td>
<td valign="middle" align="left">BNN achieved an accuracy of 85.07&#x0025;, while logistic regression achieved 92.58&#x0025;.</td>
</tr>
<tr>
<td valign="middle" align="left"><xref ref-type="bibr" rid="ref17">17</xref></td>
<td valign="middle" align="left">2018</td>
<td valign="middle" align="left">SVM, Cuckoo Search-Optimized Neural Network</td>
<td valign="middle" align="left">Cleveland dataset</td>
<td valign="middle" align="left">Tabular</td>
<td valign="middle" align="left">Support vector machine achieved an accuracy of 94.44&#x0025;.</td>
</tr>
<tr>
<td valign="middle" align="left"><xref ref-type="bibr" rid="ref18">18</xref></td>
<td valign="middle" align="left">2017</td>
<td valign="middle" align="left">CNN</td>
<td valign="middle" align="left">MIT-BIH dataset</td>
<td valign="middle" align="left">Tabular</td>
<td valign="middle" align="left">For balanced data, accuracy was 94&#x0025;, whereas for imbalanced data, accuracy dropped to 89.07&#x0025;.</td>
</tr>
<tr>
<td valign="middle" align="left"><xref ref-type="bibr" rid="ref19">19</xref></td>
<td valign="middle" align="left">2018</td>
<td valign="middle" align="left">SVM</td>
<td valign="middle" align="left">MIT-BIH dataset</td>
<td valign="middle" align="left">Tabular</td>
<td valign="middle" align="left">Imbalanced data analysis yielded 97.77&#x0025; accuracy, while noise-free ECGs achieved 97.08&#x0025; accuracy.</td>
</tr>
<tr>
<td valign="middle" align="left"><xref ref-type="bibr" rid="ref10">10</xref></td>
<td valign="middle" align="left">2023</td>
<td valign="middle" align="left">Decision tree, AdaBoost</td>
<td valign="middle" align="left">Cleveland</td>
<td valign="middle" align="left">Tabular</td>
<td valign="middle" align="left">AdaBoost outperformed decision tree.</td>
</tr>
<tr>
<td valign="middle" align="left"><xref ref-type="bibr" rid="ref11">11</xref></td>
<td valign="middle" align="left">2023</td>
<td valign="middle" align="left">RF, KNN, logistic regression, Na&#x00EF;ve Bayes, gradient boosting, AdaBoost, soft voting ensemble</td>
<td valign="middle" align="left">Cleveland, IEEE DataPort</td>
<td valign="middle" align="left">Tabular</td>
<td valign="middle" align="left">Logistic regression achieved an accuracy of 90.16&#x0025;, while AdaBoost also achieved 90&#x0025;.</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The studies presented focus on various ML algorithms applied to heart disease prediction using datasets like Cleveland and MIT-BIH. Key findings reveal that random forest (RF) and support vector machine (SVM) models consistently perform well, with RF achieving accuracies around 80&#x0025;&#x2013;85&#x0025; and SVM reaching up to 94.44&#x0025;. In some cases, ensemble methods like AdaBoost and soft voting ensemble showed competitive results, with LR achieving 90.16&#x0025;. Back-propagation neural networks and CNNs also performed strongly, with accuracy rates ranging from 89&#x0025; to 97&#x0025;, depending on data balance and noise levels. Overall, the studies highlight the effectiveness of both traditional and advanced ML techniques for heart disease prediction.</p>
</sec>
<sec id="sec005">
<title>Kidney Disease</title>
<p>Renal disease, commonly referred to as kidney disease, is nephropathy or kidney damage. Patients with kidney disease have reduced kidney function, and if left untreated, the disease can cause kidney failure. The National Kidney Foundation estimates that 10&#x0025; of the global population is affected by chronic kidney disease (CKD) and that millions of people die annually because of inadequate care. Recent renal disease detection methods based on ML and DL may extend diagnostic access to nations that cannot perform kidney disease diagnostic tests.<sup><xref ref-type="bibr" rid="ref20">20</xref></sup> In order to assess four distinct ML methods, Charleonnan et al.<sup><xref ref-type="bibr" rid="ref21">21</xref></sup> employed publicly accessible datasets. Using LR, SVM, K-nearest neighbors (KNN), and DT classifiers, the datasets were classified; the corresponding accuracy rates were 96.55&#x0025;, 98.3&#x0025;, 98.1&#x0025;, and 94.8&#x0025;. Aljaaf et al.<sup><xref ref-type="bibr" rid="ref22">22</xref></sup> compared RPART, SVM, LOGR, and MLP on the same CKD dataset used by Charleonnan et al.<sup><xref ref-type="bibr" rid="ref21">21</xref></sup> and observed that MLP was the best model, identifying CKD with 98.1&#x0025; accuracy. In order to detect chronic kidney disease, Ma et al.<sup><xref ref-type="bibr" rid="ref23">23</xref></sup> used datasets that contain records from numerous sources. They discovered that the accuracy of their proposed heterogeneous modified artificial neural network (HMANN) model ranged from 87&#x0025; to 99&#x0025;. <xref ref-type="table" rid="T2">Table 2</xref> summarizes a few studies that employed ML and DL to identify kidney illness.</p>
<table-wrap id="T2">
<label>Table 2</label>
<caption>
<title>Comparison of Machine Learning Techniques in Kidney Disease Detection</title>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th valign="middle" align="left">Study</th>
<th valign="middle" align="left">Year</th>
<th valign="middle" align="left">Algorithms Utilized</th>
<th valign="middle" align="left">Dataset Used</th>
<th valign="middle" align="left">Data Format</th>
<th valign="middle" align="left">Performance Metrics</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">26</td>
<td valign="middle" align="left">2021</td>
<td valign="middle" align="left">Na&#x00EF;ve Bayes, decision tree, RF</td>
<td valign="middle" align="left">Chronic kidney disease dataset</td>
<td valign="middle" align="left">Tabular</td>
<td valign="middle" align="left">Random forest achieved an accuracy of 100&#x0025;.</td>
</tr>
<tr>
<td valign="middle" align="left">27</td>
<td valign="middle" align="left">2020</td>
<td valign="middle" align="left">Artificial neural network (ANN), kernel K-means clustering</td>
<td valign="middle" align="left">100 patient ultrasound images</td>
<td valign="middle" align="left">Image</td>
<td valign="middle" align="left">ANN achieved an accuracy of 99.61&#x0025;.</td>
</tr>
<tr>
<td valign="middle" align="left">28</td>
<td valign="middle" align="left">2018</td>
<td valign="middle" align="left">Logistic regression, feedforward neural network, wide DL</td>
<td valign="middle" align="left">Chronic kidney disease dataset</td>
<td valign="middle" align="left">Tabular</td>
<td valign="middle" align="left">Feedforward neural network attained an F1-score of 99&#x0025;.</td>
</tr>
<tr>
<td valign="middle" align="left">29</td>
<td valign="middle" align="left">2020</td>
<td valign="middle" align="left">Convolutional neural network-support vector machine (CNN-SVM)</td>
<td valign="middle" align="left">Proprietary dataset</td>
<td valign="middle" align="left">Tabular</td>
<td valign="middle" align="left">Accuracy of 97.67&#x0025; was accompanied by a sensitivity of 97.5&#x0025; and specificity of 97.83&#x0025;.</td>
</tr>
<tr>
<td valign="middle" align="left">30</td>
<td valign="middle" align="left">2019</td>
<td valign="middle" align="left">CNN</td>
<td valign="middle" align="left">Proprietary dataset</td>
<td valign="middle" align="left">Image</td>
<td valign="middle" align="left">CNN achieved an accuracy of 95&#x0025;.</td>
</tr>
<tr>
<td valign="middle" align="left">24</td>
<td valign="middle" align="left">2023</td>
<td valign="middle" align="left">XGBoost</td>
<td valign="middle" align="left">CKD dataset</td>
<td valign="middle" align="left">Tabular</td>
<td valign="middle" align="left">XGBoost attained an accuracy of 98.3&#x0025; with an F1-score of 98&#x0025;.</td>
</tr>
<tr>
<td valign="middle" align="left">25</td>
<td valign="middle" align="left">2023</td>
<td valign="middle" align="left">MLP</td>
<td valign="middle" align="left">400 patient data</td>
<td valign="middle" align="left">Tabular</td>
<td valign="middle" align="left">MLP achieved an accuracy of 100&#x0025;.</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Islam et al.<sup><xref ref-type="bibr" rid="ref24">24</xref></sup> explored the ability to use ML approaches to diagnose CKD and found that predictive modeling would greatly improve timely detection. In evaluating 12 ML classifiers, they concluded that XGBoost performed the best with accuracy, precision, recall, and F1-score, all reaching 0.98. Furthermore, Sawhney et al.<sup><xref ref-type="bibr" rid="ref25">25</xref></sup> developed a DL-based multi-layer perceptron classifier for CKD diagnosis, with 100&#x0025; accuracy by using data from 400 patients. Using deep neural networks (DNN) from the PyTorch library, their approach surpassed conventional models like SVM and Na&#x00EF;ve Bayes and proved that neural models can be used to handle nonlinear data and enhance diagnosis accuracy.</p>
<p>The studies on kidney disease detection using ML techniques show impressive results across various algorithms and datasets. RF and multi-layer perceptron (MLP) achieved perfect accuracy (100&#x0025;) in some studies, while other models like feedforward neural networks, XGBoost, and artificial neural networks (ANN) reported high performance with accuracies above 95&#x0025;. CNNs, used on image datasets, also demonstrated strong results, with accuracies ranging from 95&#x0025; to 99.61&#x0025;. Additionally, hybrid models like CNN-SVM and kernel clustering techniques enhanced detection accuracy and sensitivity. Overall, ML techniques, particularly ensemble methods and DL, exhibit robust potential for kidney disease detection.</p>
</sec>
<sec id="sec006">
<title>Breast Cancer</title>
<p>ML has been proposed by a number of medical researchers as a means of detecting breast cancer in its early stages. For instance, Miranda and Felipe<sup><xref ref-type="bibr" rid="ref31">31</xref></sup> developed fuzzy-logic-based computer-assisted identification techniques for breast cancer classification. Fuzzy logic is superior to other traditional ML techniques because it can replicate the expert radiologist&#x2019;s method and way of thinking while lowering computational costs. If the operator enters factors like contour, form, and density, the algorithm provides a classification of cancer depending on the user&#x2019;s selection. The accuracy was roughly 83.34&#x0025; based on the model that Miranda and Felipe<sup><xref ref-type="bibr" rid="ref31">31</xref></sup> proposed. The experiment&#x2019;s precision and fairness were improved by the authors&#x2019; use of an almost equal ratio of images. However, since the authors did not explain how the results should be interpreted, it is difficult to claim that the reported accuracy holds in general for both benign and malignant classifications. Moreover, no confusion matrix is presented to show the models&#x2019; actual predictions for each class.</p>
<p>Using SVM and k-means clustering (KMC), Zheng et al.<sup><xref ref-type="bibr" rid="ref32">32</xref></sup> suggested hybrid methods for identifying breast cancer. Using the Wisconsin Diagnostic Breast Cancer (WDBC) dataset, their suggested model achieved a 97.38&#x0025; accuracy rate and significantly resolved the dimensional problem. The dataset has 32 variables organized into 10 categories and is normally distributed. It is therefore difficult to say that their suggested model would perform as well on a dataset with an uneven class distribution or with missing values.</p>
<p>Asri et al.<sup><xref ref-type="bibr" rid="ref33">33</xref></sup> employed a number of ML models, like SVM, DT (C4.5), NB, and KNN, with the WBC datasets in order to categorize the best ML models. With an accuracy of 97.13&#x0025;, the authors of the research demonstrated that SVM outperformed all other ML methods. However, the outcomes might be different if that same experiment is conducted on a different database. Furthermore, combining experimental findings from this work with ground truth values can provide a more precise indicator of the efficacy of a certain ML model.</p>
<p>Mohammed et al.<sup><xref ref-type="bibr" rid="ref34">34</xref></sup> conducted a very similar investigation. In order to identify the most effective ML techniques, the authors used three classifiers: DT (J48), NB, and sequential minimal optimization (SMO). The data were gathered from two widely used datasets: the WBC and breast cancer datasets. The study is also interesting because the authors devoted special effort to the data imbalance problem and used data resampling to alleviate it. Their results showed that the SMO algorithm performed better than the other two classifiers, reaching over 95&#x0025; precision on both datasets. However, because many resampling methods were used to reduce the imbalance ratio, the diversity of the data may also have been affected. As such, these three ML techniques may perform poorly when applied to an imbalanced or non-normally distributed dataset. Assegie<sup><xref ref-type="bibr" rid="ref35">35</xref></sup> used the grid search method to obtain the ideal KNN model parameters and found that the performance of the model was greatly affected by parameter tuning. With tuning, the model reached close to 94.35&#x0025; accuracy, as opposed to around 90&#x0025; for the default KNN.</p>
<p>Bhattacherjee et al.<sup><xref ref-type="bibr" rid="ref36">36</xref></sup> used a backpropagation neural network (BNN) to identify breast cancer. The WBC dataset with nine attributes yielded 99.27&#x0025; accuracy. Alshayeji et al.<sup><xref ref-type="bibr" rid="ref37">37</xref></sup> developed a shallow ANN to differentiate among types of breast cancer tumors using the WBCD and WDBI datasets. In doing so, the researchers showed that the proposed model could detect cancers with 99.85&#x0025; accuracy without changing the algorithms or choosing characteristics.</p>
<p>Sultana et al.<sup><xref ref-type="bibr" rid="ref38">38</xref></sup> used a different ANN architecture to detect breast cancer with the WBC dataset. The neural network (NN) models employed were modular neural networks (MNN), generalized feedforward neural networks (GFFNN), self-organizing feature maps (SOFM), multilayer perceptrons (MLP) neural networks, Jordan-Elman neural networks, recurrent neural networks (RNN), SVM neural networks, and probabilistic neural networks (PNN). According to their most recent computational results, the PNN outperformed the other neural network models utilized in that study with an accuracy of 98.24&#x0025;. However, in contrast to many other studies this work does not establish which traits are most important when it makes its predictions, making it less interpretable.</p>
<p>DL was also employed by Ghosh et al.,<sup><xref ref-type="bibr" rid="ref39">39</xref></sup> who trained seven DL models, i.e., ANN, CNN, GRU, LSTM, MLP, PNN, and RNN, on the WBC dataset. They found that LSTM and GRU had the best performance of all the DL models, with accuracy reaching almost 99&#x0025;. A selection of studies that employ ML and DL techniques to diagnose breast cancer is included in <xref ref-type="table" rid="T3">Table 3</xref> below.</p>
<table-wrap id="T3">
<label>Table 3</label>
<caption>
<title>Comparison of Machine Learning Techniques in Breast Cancer Detection</title>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th valign="middle" align="left">Study</th>
<th valign="middle" align="left">Year</th>
<th valign="middle" align="left">Algorithms Utilized</th>
<th valign="middle" align="left">Dataset Used</th>
<th valign="middle" align="left">Data Format</th>
<th valign="middle" align="left">Performance Metrics</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">42</td>
<td valign="middle" align="left">2020</td>
<td valign="middle" align="left">Na&#x00EF;ve Bayes, Bayesian network, RF, decision tree (C4.5)</td>
<td valign="middle" align="left">BCSC</td>
<td valign="middle" align="left">Image</td>
<td valign="middle" align="left">Bayesian network achieved an ROC of 0.937.</td>
</tr>
<tr>
<td valign="middle" align="left">43</td>
<td valign="middle" align="left">2015</td>
<td valign="middle" align="left">SVM</td>
<td valign="middle" align="left">Mini-MIAS, INBreast</td>
<td valign="middle" align="left">Image</td>
<td valign="middle" align="left">Mini-MIAS dataset results showed an accuracy of 99&#x0025; with an AUC of 0.9325.</td>
</tr>
<tr>
<td valign="middle" align="left">44</td>
<td valign="middle" align="left">2015</td>
<td valign="middle" align="left">SVM</td>
<td valign="middle" align="left">IRMA, DDSM</td>
<td valign="middle" align="left">Image</td>
<td valign="middle" align="left">IRMA dataset achieved a sensitivity and specificity of 99&#x0025;.</td>
</tr>
<tr>
<td valign="middle" align="left">45</td>
<td valign="middle" align="left">2017</td>
<td valign="middle" align="left">Logistic regression-ANN</td>
<td valign="middle" align="left">156 proprietary cases</td>
<td valign="middle" align="left">Image</td>
<td valign="middle" align="left">DDSM dataset achieved a sensitivity of 97&#x0025; and specificity of 96&#x0025;.</td>
</tr>
<tr>
<td valign="middle" align="left">46</td>
<td valign="middle" align="left">2016</td>
<td valign="middle" align="left">Binary logistic regression</td>
<td valign="middle" align="left">18 proprietary cases</td>
<td valign="middle" align="left">Image</td>
<td valign="middle" align="left">Binary logistic regression achieved an accuracy of 81.8&#x0025; with an AUC of 0.855.</td>
</tr>
<tr>
<td valign="middle" align="left">47</td>
<td valign="middle" align="left">2015</td>
<td valign="middle" align="left">Na&#x00EF;ve Bayes, logistic regression with AdaBoost</td>
<td valign="middle" align="left">246 proprietary images</td>
<td valign="middle" align="left">Image</td>
<td valign="middle" align="left">Logistic regression with AdaBoost achieved an accuracy of 80.39&#x0025;.</td>
</tr>
<tr>
<td valign="middle" align="left">40</td>
<td valign="middle" align="left">2024</td>
<td valign="middle" align="left">MLISBCP (K-Means SMOTE, Boruta)</td>
<td valign="middle" align="left">Breast cancer dataset</td>
<td valign="middle" align="left">Tabular</td>
<td valign="middle" align="left">Proposed model reported sensitivity of 90&#x0025; and specificity of 97.5&#x0025;.</td>
</tr>
<tr>
<td valign="middle" align="left">41</td>
<td valign="middle" align="left">2023</td>
<td valign="middle" align="left">KNN (with PCA/SVD)</td>
<td valign="middle" align="left">Fine needle aspiration dataset</td>
<td valign="middle" align="left">Tabular</td>
<td valign="middle" align="left">KNN attained an accuracy of 97.53&#x0025;.</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The risk of breast cancer is growing at an alarming rate, and Das et al.<sup><xref ref-type="bibr" rid="ref40">40</xref></sup> proposed an intelligent system, MLISBCP, to enhance breast cancer prediction. The system handled class imbalance using K-Means SMOTE and performed feature selection using Boruta, achieving an accuracy of 97.53&#x0025;, better than the existing models. Furthermore, Shafique et al.<sup><xref ref-type="bibr" rid="ref41">41</xref></sup> concentrated on feature selection approaches to improve the prediction accuracy of breast cancer. They applied methods such as principal component analysis (PCA), singular value decomposition (SVD), and chi-square, and tried several classifiers. Their results showed that, using 15 features selected by PCA, KNN achieved perfect accuracy, demonstrating the promise of optimized feature sets and balanced datasets in enhancing prediction performance.</p>
<p>The studies on breast cancer detection using ML techniques demonstrate diverse approaches and strong performance across different datasets and algorithms. Models such as SVM achieved high accuracies, with the Mini-MIAS dataset showing 99&#x0025; accuracy and an AUC of 0.9325. Hybrid models like LR combined with ANN and Na&#x00EF;ve Bayes with AdaBoost achieved high sensitivity and specificity, with LR-ANN reaching 97&#x0025; sensitivity and 96&#x0025; specificity. The use of ensemble methods, like K-Means SMOTE with Boruta and KNN with PCA/SVD, also showed robust results, with sensitivity as high as 90&#x0025; and specificity of 97.5&#x0025;. Overall, ML models exhibit excellent potential for breast cancer detection, particularly with image and tabular data.</p>
</sec>
<sec id="sec007">
<title>Diabetes</title>
<p>The IDF estimates that more than 382 million people around the world currently have diabetes and that this number may rise to 629 million by 2045.<sup><xref ref-type="bibr" rid="ref48">48</xref></sup> Many studies have described the use of ML-based systems for identifying diabetes patients. For instance, Kandhasamy and Balamurali<sup><xref ref-type="bibr" rid="ref49">49</xref></sup> investigated the performance of four ML classifiers for diagnosing patients with diabetes mellitus, namely J48 DT, KNN, RF, and SVM. The investigation was performed on the UCI diabetes dataset, and the KNN classifier (with K = 1) and the RF classifier achieved almost perfect accuracy. Nevertheless, there is one drawback in this work: the employed diabetes dataset was binary and had only eight attributes. Therefore, it is not surprising that near-100&#x0025; accuracy was obtained on such a simple dataset. Additionally, there is no explanation of how the algorithms influence the final prediction or of how a non-technical reader should interpret the results.</p>
<p>A Clinical Decision Support System (CDSS) was created by Yahyaoui et al.<sup><xref ref-type="bibr" rid="ref50">50</xref></sup> to assist doctors or practitioners in diagnosing diabetes. This study used a number of ML methods, including SVM, RF, and deep CNN, to accomplish this goal. RF yielded the best result in computations with an accuracy of 83.67&#x0025; compared with DL and SVM having 76.81&#x0025; and 65.38&#x0025;.</p>
<p>Naz and Ahuja<sup><xref ref-type="bibr" rid="ref48">48</xref></sup> used the open-source PIMA diabetes dataset with ANN, NB, DT, and DL in their study. According to the authors, the DL method is effective in detecting the onset of diabetes, with an average accuracy of 98.07&#x0025;. PIMA is one of the most studied and basic datasets, which makes it easy to apply traditional and sophisticated ML algorithms. Thus, it is unsurprising that high accuracy is obtained on the PIMA Indian dataset. Moreover, the article does not discuss the interpretability of the model or how the model would handle unbalanced data or data with many missing values. For example, data generated in the healthcare industry may be of different types and are not necessarily characterized, categorized, and preprocessed in the same fashion as the PIMA Indian dataset. It is therefore important to assess the fairness, absence of bias, reliability, and interpretability of a model when developing a CDSS, especially when working with a multiclass classification dataset in which a large amount of data is missing.</p>
<p>Ashiquzzaman et al.<sup><xref ref-type="bibr" rid="ref51">51</xref></sup> introduced a DL approach to handle overfitting in diabetes datasets. Using the PIMA Indian dataset, the proposed technique gave an accuracy of 88.41&#x0025;. The authors report that results were considerably enhanced when dropout was implemented within the model and that overfitting issues were thereby eliminated. However, excessive use of dropout increases the overall training time. It is hard to say whether the suggested model is the best one in terms of computational time, as the authors did not take this factor into account in their analysis.</p>
<p>Alhassan et al.<sup><xref ref-type="bibr" rid="ref52">52</xref></sup> presented the King Abdullah International Medical Research Center Diabetes (KAIMRCD) dataset, the world&#x2019;s largest diabetic dataset, with data from 14,000 individuals. In the experiment, the authors&#x2019; CDSS architecture achieved an accuracy of 97&#x0025; using LSTM- and GRU-based deep NN. <xref ref-type="table" rid="T4">Table 4</xref> gives a brief review of studies that used ML and DL techniques for diabetic diagnosis.</p>
<table-wrap id="T4">
<label>Table 4</label>
<caption>
<title>Comparison of Machine Learning Techniques in Diabetes Detection</title>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th valign="middle" align="left">Study</th>
<th valign="middle" align="left">Year</th>
<th valign="middle" align="left">Algorithms Utilized</th>
<th valign="middle" align="left">Dataset Used</th>
<th valign="middle" align="left">Data Format</th>
<th valign="middle" align="left">Performance Metrics</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">55</td>
<td valign="middle" align="left">2019</td>
<td valign="middle" align="left">Dirichlet Process Mixture (DPM)</td>
<td valign="middle" align="left">Proprietary dataset</td>
<td valign="middle" align="left">Tabular</td>
<td valign="middle" align="left">DPM achieved an accuracy of 96.74&#x0025;.</td>
</tr>
<tr>
<td valign="middle" align="left">56</td>
<td valign="middle" align="left">2021</td>
<td valign="middle" align="left">RF</td>
<td valign="middle" align="left">DIABIM-MUNE</td>
<td valign="middle" align="left">Tabular</td>
<td valign="middle" align="left">RF reported an AUC of 0.80.</td>
</tr>
<tr>
<td valign="middle" align="left">57</td>
<td valign="middle" align="left">2020</td>
<td valign="middle" align="left">KNN</td>
<td valign="middle" align="left">Proprietary dataset (4900 samples)</td>
<td valign="middle" align="left">Tabular</td>
<td valign="middle" align="left">KNN attained an accuracy of 99.9&#x0025;.</td>
</tr>
<tr>
<td valign="middle" align="left">58</td>
<td valign="middle" align="left">2018</td>
<td valign="middle" align="left">SVM, Decision tree, ANN, logistic Regression</td>
<td valign="middle" align="left">Proprietary dataset</td>
<td valign="middle" align="left">Tabular</td>
<td valign="middle" align="left">SVM demonstrated an accuracy of 79.5&#x0025; with an AUC of 0.839.</td>
</tr>
<tr>
<td valign="middle" align="left">59</td>
<td valign="middle" align="left">2021</td>
<td valign="middle" align="left">PSO, MLPNN</td>
<td valign="middle" align="left">Proprietary dataset</td>
<td valign="middle" align="left">Tabular</td>
<td valign="middle" align="left">PSO achieved an accuracy of 98.73&#x0025;.</td>
</tr>
<tr>
<td valign="middle" align="left">53</td>
<td valign="middle" align="left">2022</td>
<td valign="middle" align="left">KNN, Na&#x00EF;ve Bayes</td>
<td valign="middle" align="left">Diabetes dataset</td>
<td valign="middle" align="left">Tabular</td>
<td valign="middle" align="left">Na&#x00EF;ve Bayes outperformed KNN in accuracy.</td>
</tr>
<tr>
<td valign="middle" align="left">54</td>
<td valign="middle" align="left">2024</td>
<td valign="middle" align="left">Logistic regression, SVM, Na&#x00EF;ve Bayes, RF, XGBoost, LightGBM, CatBoost, AdaBoost, Bagging</td>
<td valign="middle" align="left">Kaggle Diabetes dataset</td>
<td valign="middle" align="left">Tabular</td>
<td valign="middle" align="left">CatBoost achieved an accuracy of 95.4&#x0025; and an AUC-ROC of 0.99.</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>ML for diabetes prediction was explored by Febrian et al.,<sup><xref ref-type="bibr" rid="ref53">53</xref></sup> who compared KNN and Na&#x00EF;ve Bayes. They evaluated the confusion matrix for diabetes prediction using health attributes and found that Na&#x00EF;ve Bayes significantly outperformed KNN. Moreover, Modak and Jha<sup><xref ref-type="bibr" rid="ref54">54</xref></sup> developed an innovative diabetes prediction model using several ML techniques, including LR, SVM, Na&#x00EF;ve Bayes, and RF. They enhanced the model with ensemble methods such as XGBoost, LightGBM, CatBoost, AdaBoost, and Bagging. Among these, CatBoost achieved the highest accuracy of 95.4&#x0025;, outperforming XGBoost, and demonstrated a superior AUC-ROC score of 0.99, showcasing its potential for more accurate diabetes forecasting.</p>
<p>The studies on diabetes detection using ML techniques show a variety of models and strong performance across different datasets. The Dirichlet Process Mixture (DPM) achieved an impressive accuracy of 96.74&#x0025;, while RF reported an AUC of 0.80 on the DIABIM-MUNE dataset. KNN demonstrated high accuracy, reaching 99.9&#x0025; on a proprietary dataset, while SVM achieved 79.5&#x0025; accuracy with an AUC of 0.839. The particle-swarm-optimization-based MLP neural network (PSO-MLPNN) model reached an accuracy of 98.73&#x0025;. Additionally, models like Na&#x00EF;ve Bayes outperformed KNN in accuracy, and the more recent study using a range of algorithms on the Kaggle diabetes dataset saw CatBoost achieving 95.4&#x0025; accuracy and an AUC-ROC of 0.99, showcasing the potential of ensemble methods and advanced models for diabetes detection.</p>
</sec>
<sec id="sec008">
<title>COVID-19</title>
<p>The most significant problem of the century is the highly contagious illness linked to the novel severe acute respiratory syndrome coronavirus 2 (SARS-CoV-2), sometimes referred to as COVID-19. Many people did not have access to the vaccine throughout the crisis, even though vaccines were being distributed in response to the worldwide pandemic.<sup><xref ref-type="bibr" rid="ref60">60</xref></sup> The high transmissibility and vaccine resistance of the novel COVID-19 Omicron strain are additional causes for concern. The real-time reverse transcription-polymerase chain reaction (RT-PCR) is currently the gold standard for diagnosing COVID-19 infection.<sup><xref ref-type="bibr" rid="ref61">61</xref></sup> Researchers have further suggested that ML and AI can be employed together with imaging tools such as X-ray and CT scans to screen individuals who might be affected by the outbreak. For instance, Chen et al.<sup><xref ref-type="bibr" rid="ref62">62</xref></sup> suggested a UNet&#x002B;&#x002B; model with CT images from 51 COVID-19 and 82 non-COVID-19 patients, with their accuracy being 98.5&#x0025;. Abbasian et al.<sup><xref ref-type="bibr" rid="ref63">63</xref></sup> compared the performance of 10 distinct DL models using a small dataset of 108 COVID-19 and 86 non-COVID-19 cases, achieving an overall accuracy of 99&#x0025;. Wang et al.<sup><xref ref-type="bibr" rid="ref64">64</xref></sup> developed an inception-based model using a dataset of 453 CT scan images and achieved 73.1&#x0025; accuracy. Unfortunately, the region of interest (ROI) and network activity of the model were not well defined. The COVNet model was presented by Lin et al.<sup><xref ref-type="bibr" rid="ref65">65</xref></sup> using a large dataset of 4356 positive chest CT images of pneumonia patients and 1296 positive chest CT images of COVID-19 patients, with an accuracy of 96&#x0025;.</p>
<p>At the same time, several reports recommended using chest X-ray images for COVID screening (such as those by Lababidi et al., Khoudour et al., and Narin et al.<sup><xref ref-type="bibr" rid="ref66">66</xref>&#x2013;<xref ref-type="bibr" rid="ref68">68</xref></sup>). Additionally, the other studies made use of larger datasets in order to produce more sophisticated screening methods. For the purposes of the current research, Brunese et al.<sup><xref ref-type="bibr" rid="ref69">69</xref></sup> used 6505 scans with a 1:1.17 data ratio, of which 3520 were classified as &#x201C;other patients&#x201D; and 3003 as COVID-19 symptoms. Ghoshal and Tucker<sup><xref ref-type="bibr" rid="ref70">70</xref></sup> obtained 92.9&#x0025; accuracy with a dataset of 5941 images. Neither of the two studies considered the issue of how the proposed models would perform when presented with data that is skewed and has different class distributions. Apostolopoulos and Mpesiana<sup><xref ref-type="bibr" rid="ref71">71</xref></sup> employed a convolutional-neural-network-based Xception model on a dataset of COVID-19 and non-COVID-19 cases. The dataset included chest X-ray scans of 284 COVID-19 and 967 non-COVID-19 patients, with an average accuracy of 89.6&#x0025;.</p>
<p>Solayman et al.<sup><xref ref-type="bibr" rid="ref72">72</xref></sup> developed an ML-based intelligent web application for COVID-19 detection, using techniques such as LR, RF, DT, k-nearest neighbor, SVM, ensemble models (AdaBoost, XGBoost), and DL (artificial neural network, CNN, LSTM). They applied the SMOTE technique for data balancing and the LIME framework for explainable AI, with the hybrid CNN-LSTM model achieving 96.34&#x0025; accuracy and a 0.98 F1 score on a dataset obtained from the Israeli Ministry of Health. Moreover, Nanehkaran et al.<sup><xref ref-type="bibr" rid="ref73">73</xref></sup> focused on predicting the environmental impact of pandemic plastics using a DNN model. Their study used data from February 2020 to October 2021 on COVID-19 spread and PPE usage, with the DNN model outperforming other algorithms like KNN, DT, and RFs, achieving an AUC of 0.929 and lower error rates (MSE = 0.024, RMSE &#x003D; 0.027).</p>
<p>In <xref ref-type="table" rid="T5">Table 5</xref> below, the present study identified some of the works that utilized ML and DL techniques to diagnose COVID-19.</p>
<table-wrap id="T5">
<label>Table 5</label>
<caption>
<title>Comparison of Machine Learning Techniques in COVID-19 Detection</title>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th valign="middle" align="left">Study</th>
<th valign="middle" align="left">Year</th>
<th valign="middle" align="left">Algorithms Utilized</th>
<th valign="middle" align="left">Dataset Used</th>
<th valign="middle" align="left">Data Format</th>
<th valign="middle" align="left">Performance Metrics</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">65</td>
<td valign="middle" align="left">2020</td>
<td valign="middle" align="left">CNN</td>
<td valign="middle" align="left">Mixed dataset</td>
<td valign="middle" align="left">Image</td>
<td valign="middle" align="left">CNN achieved an accuracy of 90&#x0025;.</td>
</tr>
<tr>
<td valign="middle" align="left">62</td>
<td valign="middle" align="left">2020</td>
<td valign="middle" align="left">CNN</td>
<td valign="middle" align="left">Mixed dataset</td>
<td valign="middle" align="left">Image</td>
<td valign="middle" align="left">CNN reported an accuracy of 98.5&#x0025;.</td>
</tr>
<tr>
<td valign="middle" align="left">74</td>
<td valign="middle" align="left">2021</td>
<td valign="middle" align="left">CNN</td>
<td valign="middle" align="left">Mixed dataset</td>
<td valign="middle" align="left">Image</td>
<td valign="middle" align="left">CNN attained an accuracy of 86&#x0025;.</td>
</tr>
<tr>
<td valign="middle" align="left">75</td>
<td valign="middle" align="left">2020</td>
<td valign="middle" align="left">CNN</td>
<td valign="middle" align="left">Cohen&#x2019;s dataset</td>
<td valign="middle" align="left">Image</td>
<td valign="middle" align="left">CNN achieved an accuracy of 94.1&#x0025;.</td>
</tr>
<tr>
<td valign="middle" align="left">76</td>
<td valign="middle" align="left">2020</td>
<td valign="middle" align="left">CNN</td>
<td valign="middle" align="left">Cohen&#x2019;s dataset</td>
<td valign="middle" align="left">Image and Tabular</td>
<td valign="middle" align="left">CNN demonstrated an accuracy of 95.38&#x0025;.</td>
</tr>
<tr>
<td valign="middle" align="left">72</td>
<td valign="middle" align="left">2023</td>
<td valign="middle" align="left">Logistic regression, RF, decision tree, KNN, SVM, AdaBoost, XGBoost, CNN, LSTM</td>
<td valign="middle" align="left">COVID-19 symptoms dataset (Israeli Ministry of Health)</td>
<td valign="middle" align="left">Tabular</td>
<td valign="middle" align="left">Hybrid CNN-LSTM achieved the highest accuracy of 96.34&#x0025;.</td>
</tr>
<tr>
<td valign="middle" align="left">73</td>
<td valign="middle" align="left">2023</td>
<td valign="middle" align="left">Deep neural network (DNN), KNN, decision tree, RF, SVM, Gaussian Na&#x00EF;ve Bayes, logistic regression, multilayer perceptron</td>
<td valign="middle" align="left">COVID-19 spread and PPE usage data (Iran)</td>
<td valign="middle" align="left">Tabular</td>
<td valign="middle" align="left">DNN achieved the highest AUC of 0.929.</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The studies on COVID-19 detection using ML techniques highlight the strong performance of CNN across various datasets, with accuracy values ranging from 86&#x0025; to 98.5&#x0025;. Notably, CNN models demonstrated accuracy of 94.1&#x0025; and 95.38&#x0025; on Cohen&#x2019;s dataset, and 90&#x0025; on a mixed dataset. Additionally, in a study comparing LR, RF, DT, KNN, SVM, AdaBoost, XGBoost, CNN, and long short-term memory (LSTM) models, a hybrid CNN-LSTM achieved a high accuracy of 96.34&#x0025; on a COVID-19 symptoms dataset. Another study employing a variety of models on COVID-19 spread and PPE usage data reported an AUC of 0.929 for its DNN model, demonstrating the effectiveness of DL and traditional ML models for detecting and analyzing COVID-19.</p>
</sec>
<sec id="sec009">
<title>Other Diseases</title>
<p>Both ML and DL have been used to detect diseases other than the ones listed above. There are two key causes for this rising application: big data and the progress in computer hardware. For example, Mao et al. used eye movement to classify diseases using DT and RF.<sup><xref ref-type="bibr" rid="ref77">77</xref></sup> When designing automatic skin disease categorization systems, Nosseir and Shawky<sup><xref ref-type="bibr" rid="ref78">78</xref></sup> compared KNN with SVM; KNN performed best, with an accuracy of 98.22&#x0025;. Khan et al.<sup><xref ref-type="bibr" rid="ref79">79</xref></sup> classified multimodal brain cancers using CNN-based models such as VGG16 and VGG19. Three publicly accessible image datasets were used in the experiment: BraTs2015, BraTs2017, and BraTs2018, on which the proposed method achieved accuracies of 97.8&#x0025;, 96.9&#x0025;, and 92.5&#x0025;, respectively. Similar work was done by Imran et al.,<sup><xref ref-type="bibr" rid="ref28">28</xref></sup> who used the RF classifier for tumor segmentation. Using the datasets BRATS 2012, BRATS 2013, BRATS 2014, BRATS 2015, and ISLES 2015, the authors obtained overall accuracies of 98.7&#x0025;, 98.7&#x0025;, 98.4&#x0025;, 90.2&#x0025;, and 90.2&#x0025;, respectively.<sup><xref ref-type="bibr" rid="ref80">80</xref></sup></p>
<p>Dai et al.<sup><xref ref-type="bibr" rid="ref81">81</xref></sup> developed a CNN as the basis of an application for the detection of skin cancer. Using the publicly available HAM10000 dataset, the authors achieved an accuracy of 75.2&#x0025;. In 2020, Dai et al.<sup><xref ref-type="bibr" rid="ref81">81</xref></sup> used KNN, SVM, CNN, and majority voting to identify melanoma skin cancer using the ISIC dataset. Majority voting achieved the highest accuracy, at 88.4&#x0025;. A list of some of the literature reviewed in this study using ML and DL in disease diagnosis is presented in <xref ref-type="table" rid="T6">Table 6</xref>.</p>
<table-wrap id="T6">
<label>Table 6</label>
<caption>
<title>Comparison of Machine Learning Techniques in Various Disease Detection</title>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th valign="middle" align="left">Study</th>
<th valign="middle" align="left">Application</th>
<th valign="middle" align="left">Algorithms Utilized</th>
<th valign="middle" align="left">Dataset Used</th>
<th valign="middle" align="left">Data Format</th>
<th valign="middle" align="left">Performance Metrics</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">82</td>
<td valign="middle" align="left">Classification of pediatric colonic inflammatory bowel disease</td>
<td valign="middle" align="left">RF</td>
<td valign="middle" align="left">74 proprietary cases</td>
<td valign="middle" align="left">Image</td>
<td valign="middle" align="left">RF achieved an accuracy of 100&#x0025;.</td>
</tr>
<tr>
<td valign="middle" align="left">83</td>
<td valign="middle" align="left">Liver disease classification</td>
<td valign="middle" align="left">SVM</td>
<td valign="middle" align="left">ILPD, BUPA</td>
<td valign="middle" align="left">Tabular</td>
<td valign="middle" align="left">SVM reported an accuracy of 90&#x0025;&#x2013;92&#x0025;.</td>
</tr>
<tr>
<td valign="middle" align="left">84</td>
<td valign="middle" align="left">Brain tumor diagnosis</td>
<td valign="middle" align="left">CNN</td>
<td valign="middle" align="left">Brain tumor challenge sites and MRI</td>
<td valign="middle" align="left">Image</td>
<td valign="middle" align="left">CNN demonstrated an accuracy range of 90&#x0025;&#x2013;99&#x0025;.</td>
</tr>
<tr>
<td valign="middle" align="left">85</td>
<td valign="middle" align="left">Brain tumor segmentation</td>
<td valign="middle" align="left">RF</td>
<td valign="middle" align="left">MICCAI, BraTS 2013</td>
<td valign="middle" align="left">Image</td>
<td valign="middle" align="left">RF achieved an 88&#x0025; Dice overlap.</td>
</tr>
<tr>
<td valign="middle" align="left">86</td>
<td valign="middle" align="left">Melanoma detection using dermoscopic images</td>
<td valign="middle" align="left">SVM with color and feature extraction</td>
<td valign="middle" align="left">PH2</td>
<td valign="middle" align="left">Image</td>
<td valign="middle" align="left">SVM attained an accuracy of 96&#x0025;.</td>
</tr>
<tr>
<td valign="middle" align="left">87</td>
<td valign="middle" align="left">Melanoma skin cancer detection</td>
<td valign="middle" align="left">Na&#x00EF;ve Bayes, decision tree, KNN</td>
<td valign="middle" align="left">MED-NODE</td>
<td valign="middle" align="left">Image</td>
<td valign="middle" align="left">A decision tree classifier reported an accuracy of 82.35&#x0025;.</td>
</tr>
<tr>
<td valign="middle" align="left">88</td>
<td valign="middle" align="left">Skin cancer detection with thermal imaging</td>
<td valign="middle" align="left">EL and DL</td>
<td valign="middle" align="left">CSLTAD</td>
<td valign="middle" align="left">Image</td>
<td valign="middle" align="left">EL achieved a precision of 0.9665.</td>
</tr>
<tr>
<td valign="middle" align="left">89</td>
<td valign="middle" align="left">Hepatocellular carcinoma detection</td>
<td valign="middle" align="left">InceptionV3</td>
<td valign="middle" align="left">Genomic Data Commons</td>
<td valign="middle" align="left">Image</td>
<td valign="middle" align="left">InceptionV3 reported an accuracy of 89&#x0025;&#x2013;96&#x0025;.</td>
</tr>
<tr>
<td valign="middle" align="left">90</td>
<td valign="middle" align="left">Prediction of HCC postoperative death outcomes</td>
<td valign="middle" align="left">RF, gradient boosting, GBM, logistic regression, decision tree</td>
<td valign="middle" align="left">BioStudies database</td>
<td valign="middle" align="left">Tabular</td>
<td valign="middle" align="left">A random forest model demonstrated an AUC of 0.803.</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The studies on various disease detection using ML techniques show a diverse range of successful applications. For pediatric colonic inflammatory bowel disease, RF achieved 100&#x0025; accuracy. In liver disease classification, SVM demonstrated accuracy between 90&#x0025; and 92&#x0025;. For brain tumor diagnosis, CNN achieved accuracies between 90&#x0025; and 99&#x0025;, while RF performed well in brain tumor segmentation with an 88&#x0025; Dice overlap. In melanoma detection, SVM with feature extraction achieved 96&#x0025; accuracy, and DT reported 82.35&#x0025; for skin cancer detection. Thermal imaging for skin cancer showed a precision of 0.9665 with EL. In hepatocellular carcinoma (HCC) detection, InceptionV3 reported accuracy between 89&#x0025; and 96&#x0025;, while RF models demonstrated an AUC of 0.803 for predicting HCC postoperative death outcomes, indicating the wide applicability and success of ML techniques in medical diagnostics.</p>
</sec>
<sec id="sec010" sec-type="discussion">
<title>Discussion</title>
<p>A significant reliance on ML, EL, and DL models is found in the literature to perform disease classification across diverse medical datasets as shown in <xref ref-type="fig" rid="F2">Figure 2</xref>. These ML models (RF and SVM) are employed as they have proved to deliver robust performance on image as well as tabular datasets, as evident in studies of Dhaliwal et al.,<sup><xref ref-type="bibr" rid="ref82">82</xref></sup> Waheed et al.,<sup><xref ref-type="bibr" rid="ref86">86</xref></sup> and Wang et al.,<sup><xref ref-type="bibr" rid="ref90">90</xref></sup> which showed that EL techniques like gradient boosting and AdaBoost can combine many weak learners into a more reliable and accurate predictor. For image-based diagnosis tasks like brain tumor detection<sup><xref ref-type="bibr" rid="ref84">84</xref></sup> and melanoma classification,<sup><xref ref-type="bibr" rid="ref88">88</xref></sup> CNNs are often used as DL models to extract the best characteristics from complex data. The reason these methods are widely adopted is that they have been shown to enhance diagnostic accuracy and to cope with different data formats and complexities.</p>
<fig id="F2" position="float">
<object-id pub-id-type="doi">10.70389/journal.pjs.100043.g002</object-id>
<label>Fig 2</label>
<caption><title>Distribution of models among the studies</title>
</caption>
<p><ext-link ext-link-type="uri" xlink:href="https://i0.wp.com/premierscience.com/wp-content/uploads/2025/05/pjs-24-579-Figure-2.jpg">Figure 2</ext-link></p>
</fig>
<p>The reviewed literature also shows how the choice of algorithm is strategically constrained by disease dynamics and data properties. Owing to their high accuracy and their capability to work well with structured tabular data, ML models dominate breast cancer detection<sup><xref ref-type="bibr" rid="ref41">41</xref></sup> and heart disease classification.<sup><xref ref-type="bibr" rid="ref13">13</xref></sup> For the prediction of diseases like diabetes<sup><xref ref-type="bibr" rid="ref54">54</xref></sup> and liver cancer,<sup><xref ref-type="bibr" rid="ref90">90</xref></sup> EL techniques such as gradient boosting and RF are often used because combining multiple models makes their predictions more reliable. Because CNNs, a subset of DL models, are capable of obtaining important characteristics from high-dimensional image data, they are chosen for imagery-focused tasks like COVID-19 detection<sup><xref ref-type="bibr" rid="ref72">72</xref></sup> and brain tumor diagnosis.<sup><xref ref-type="bibr" rid="ref84">84</xref></sup> The disease-specific requirements and the strengths of each algorithm type were aligned when selecting models to suit the diversity of diagnostic applications without diminishing performance. The mapping of diseases and models is shown in <xref ref-type="fig" rid="F3">Figure 3</xref>.</p>
<fig id="F3" position="float">
<object-id pub-id-type="doi">10.70389/journal.pjs.100043.g003</object-id>
<label>Fig 3</label>
<caption><title>Disease and model mapping</title>
</caption>
<p><ext-link ext-link-type="uri" xlink:href="https://i0.wp.com/premierscience.com/wp-content/uploads/2025/05/pjs-24-579-Figure-3.jpg">Figure 3</ext-link></p>
</fig>
<p>Computational models have evolved over the years and are increasingly being adopted and improved for medical diagnosis and prediction tasks, as shown in <xref ref-type="fig" rid="F4">Figure 4</xref>. From 2015 to 2016, the landscape was dominated by ML models such as LR and SVM,<sup><xref ref-type="bibr" rid="ref43">43</xref></sup> owing to their simplicity and effectiveness on tabular and image data. In 2017 and 2018, there was a rapid increase in the usage of DL models (e.g., CNNs),<sup><xref ref-type="bibr" rid="ref45">45</xref></sup> thanks to the increasing availability of computational power and medical imaging data. As a result, by 2019&#x2013;2020, ensemble learning (EL) techniques, which include RF and gradient boosting,<sup><xref ref-type="bibr" rid="ref57">57</xref></sup> had become popular because model aggregation yields higher prediction accuracy, while DL models were rapidly adopted for tasks that need complex feature extraction, such as the diagnosis of brain tumors.<sup><xref ref-type="bibr" rid="ref84">84</xref></sup> The use of all three model types grew exponentially between 2021 and 2022, aided by more diverse data and hybrid approaches.<sup><xref ref-type="bibr" rid="ref72">72</xref></sup> The period from 2023 to 2024 has seen a significant increase in the adoption of deep learning (DL) and ensemble learning (EL) methods. For example, research has highlighted the effectiveness of the CatBoost algorithm in predicting diabetes, and a hybrid model combining Convolutional Neural Networks (CNN) and Long Short-Term Memory (LSTM) networks has shown promise in detecting COVID-19; this illustrates the move from simpler, less laborious methods for medical analytics to more advanced and data-intensive ones.</p>
<fig id="F4" position="float">
<object-id pub-id-type="doi">10.70389/journal.pjs.100043.g004</object-id>
<label>Fig 4</label>
<caption><title>Evolution of models in early disease detection</title>
</caption>
<p><ext-link ext-link-type="uri" xlink:href="https://i0.wp.com/premierscience.com/wp-content/uploads/2025/05/pjs-24-579-Figure-4.jpg">Figure 4</ext-link></p>
</fig>
</sec>
<sec id="sec011">
<title>Challenges and Opportunities in Early Disease Detection</title>
<p>A tide of potential healthcare advancement comes with incorporating ML into early disease detection. However, it is also a challenging environment that goes beyond technical complexities. When embarking on the exciting path of leveraging predictive power for detecting diseases at an early stage, we must acknowledge the ethical and technical foundations on which this transformation rests. Sensitivities in the healthcare industry revolve around personal and medical data, which constitute highly sensitive medical information. Secure data storage, transmission, and access controls are necessary to protect patient privacy. A long-standing challenge is to strike an equilibrium between the use of data for early detection models and the protection of patient privacy.<sup><xref ref-type="bibr" rid="ref91">91</xref></sup></p>
<p>Before using patient data in predictive models, we must have consent. A key aspect of establishing trust between patients and healthcare providers involves transparent communication of what data might be used for, as well as the associated potential hazards and benefits. When ML models are trained on historical data, any inherent biases in that data can be inadvertently learned by those models. This can lead to unfair predictions that have been shown to disproportionately affect members of certain demographic groups. Eliminating bias and achieving fairness in predictive models are critical for achieving equitable healthcare outcomes. As ML models become increasingly elaborate, they tend to turn into &#x201C;black boxes,&#x201D; and it is often hard to understand exactly how they arrive at their predictions. If models are not explicable and comprehensible,<sup><xref ref-type="bibr" rid="ref92">92</xref></sup> healthcare professionals will not be able to rely on and act upon their predictions.</p>
<p>The integration of ML into healthcare workflows raises concerns about inaccurate predictions and about which entity should be held accountable when incorrect predictions are made. It is difficult to determine responsibility and set up rules for corrective actions in these situations. How representative and how good the training data is determines how precise the predictive models will be; erroneous or insufficient data often leads to inaccurate predictions. Therefore, thorough data preprocessing and sufficient time for generating predictions are required. Moreover, to confirm that predictive models are dependable and generalizable, they must be validated on diverse and independent datasets. A further technical issue to be solved is the problem of overfitting, which occurs when a model performs well on the training data but poorly on new data.</p>
<p>Certain ML methods are too complicated to use in medical environments. In order to build trust, models need to be developed that generate interpretable insights so that healthcare professionals can understand the reasoning behind predictions. Integrating predictive models into current clinical workflows is a technical challenge. To be integrated seamlessly, they have to be compatible with electronic health records, imaging systems, and other healthcare technologies. Since healthcare data is becoming larger and larger, predictive models need to be scalable to process large datasets efficiently. Scalability ensures that models remain effective as the volume of data increases. A further technical challenge arises when real-time predictions are needed: predictive models must process data rapidly and produce practical insights in a timely fashion. Multiple stakeholders need to collaborate to steer the intersection of ethical and technical considerations in the predictive detection of diseases.<sup><xref ref-type="bibr" rid="ref93">93</xref></sup> Only multidisciplinary teams including healthcare professionals working with data scientists, ethicists, legal experts, and policymakers can design ethical guidelines and structures. ML holds enormous potential to revolutionize the healthcare industry through predictive disease detection. Yet the voyage is beset with ethical and technical hurdles that have to be surmounted in order for a responsible, equitable implementation. Striking the right balance between improving technology and keeping ethical values is necessary not only for successful adoption but also for obtaining the maximum benefits from predictive power with the minimum associated risks (<xref ref-type="table" rid="T7">Table 7</xref>).</p>
<table-wrap id="T7">
<label>Table 7</label>
<caption>
<title>Summary of Challenges and Solutions</title>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th valign="middle" align="left">Aspect</th>
<th valign="middle" align="left">Challenges</th>
<th valign="middle" align="left">Solutions/Considerations</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="left">Data Privacy and Security</td>
<td valign="middle" align="left">Sensitive personal and medical data require secure storage, transmission, and access controls to protect patient privacy.</td>
<td valign="middle" align="left">Ensure consent before using patient data; Implement strong security measures to protect data; Develop transparent communication strategies with patients about data usage and potential risks/benefits.</td>
</tr>
<tr>
<td valign="middle" align="left">Bias in Data</td>
<td valign="middle" align="left">Machine learning models may inherit biases from historical data, leading to unfair predictions and disproportionately affecting certain demographic groups.</td>
<td valign="middle" align="left">Eliminate biases and ensure fairness in models; Regularly audit models for discriminatory outcomes.</td>
</tr>
<tr>
<td valign="middle" align="left">Model Explainability</td>
<td valign="middle" align="left">Complex models may act as &#x201C;black boxes,&#x201D; making it hard for healthcare professionals to understand how predictions are made, affecting trust and reliability.</td>
<td valign="middle" align="left">Develop interpretable models that provide clear explanations for predictions; Ensure healthcare professionals can act on the model&#x2019;s insights.</td>
</tr>
<tr>
<td valign="middle" align="left">Accountability for Inaccurate Predictions</td>
<td valign="middle" align="left">Uncertainty about who is responsible for incorrect predictions and the corrective actions needed.</td>
<td valign="middle" align="left">Establish clear accountability rules; Define corrective actions for incorrect predictions; Ensure reliable and accurate data is used for model training.</td>
</tr>
<tr>
<td valign="middle" align="left">Data Quality and Preprocessing</td>
<td valign="middle" align="left">Erroneous or insufficient data can lead to inaccurate predictions, making data preprocessing and model validation essential.</td>
<td valign="middle" align="left">Ensure high-quality, diverse data is used for training; Perform thorough data preprocessing; Validate models using independent datasets to improve accuracy and generalizability.</td>
</tr>
<tr>
<td valign="middle" align="left">Overfitting</td>
<td valign="middle" align="left">Overfitting occurs when models perform well on training data but poorly on new, unseen data.</td>
<td valign="middle" align="left">Regularize models, use cross-validation techniques, and ensure diverse datasets to prevent overfitting.</td>
</tr>
<tr>
<td valign="middle" align="left">Model Complexity and Usability</td>
<td valign="middle" align="left">Some machine learning methods are too complex for use in medical environments, affecting adoption and trust.</td>
<td valign="middle" align="left">Develop simpler, interpretable models that generate understandable insights for healthcare professionals.</td>
</tr>
<tr>
<td valign="middle" align="left">Integration into Clinical Workflows</td>
<td valign="middle" align="left">Integrating predictive models into existing healthcare technologies like electronic health records and imaging systems is a technical challenge.</td>
<td valign="middle" align="left">Ensure models are compatible with current systems; Work with healthcare professionals to streamline integration into daily clinical workflows.</td>
</tr>
<tr>
<td valign="middle" align="left">Scalability</td>
<td valign="middle" align="left">Predictive models need to efficiently process large datasets, particularly as healthcare data continues to grow.</td>
<td valign="middle" align="left">Design scalable models that can handle increasing volumes of data without compromising speed or accuracy.</td>
</tr>
<tr>
<td valign="middle" align="left">Real-Time Predictions</td>
<td valign="middle" align="left">Real-time predictions require models that can process data quickly and deliver practical insights in a timely manner.</td>
<td valign="middle" align="left">Optimize models for real-time prediction and response, ensuring low latency for time-sensitive decision-making.</td>
</tr>
<tr>
<td valign="middle" align="left">Multidisciplinary Collaboration</td>
<td valign="middle" align="left">Developing ethical and technical guidelines requires input from multiple stakeholders, including healthcare professionals, data scientists, ethicists, legal experts, and policymakers.</td>
<td valign="middle" align="left">Encourage collaboration across disciplines to create comprehensive ethical frameworks and technical solutions for responsible predictive disease detection.</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="sec012">
<title>A Glimpse into the Future: Emerging Trends and Prospects in Machine-Learning-Driven Early Disease Diagnostics</title>
<p>The application of ML to early disease detection has led to significant healthcare advances, but the road ahead is promising. As technology and our understanding of diseases advance, ML-based early disease detection appears to be on the brink of an emerging trend that could shape the future of healthcare. These trends have the potential to revitalize the healthcare system while improving our capacity to identify diseases early on. Predictive model optimization will require the integration of data from multiple sources, such as wearable technologies, medical imaging, genomic data, and electronic health records. A more accurate and detailed picture of a patient&#x2019;s health status will be provided by ML algorithms that integrate many data modalities, such as test results, radiological images, prescription drugs, and vital signs. The need for model interpretability is growing as ML models get more intricate. The rise of explainable AI, which seeks to create algorithms that can provide an explanation for their predictions, allays this worry. Gaining the trust of medical experts and empowering them to base their decisions on the algorithmically offered insights will depend on this. Transfer learning is the process of training ML models for some conditions and then using what they have learned to identify other diseases that are similar. The versatility of this approach enables models created for one disease to be altered for the early diagnosis of related diseases, boosting output and speeding up model development.<sup><xref ref-type="bibr" rid="ref94">94</xref></sup></p>
<p>With the abundance of gadgets and ongoing health monitoring, ML algorithms can now make predictions and issue real-time alerts. This benefits both patients and medical professionals by giving them timely notification about upcoming health issues so that prompt treatment and prevention can take place. Although quantum computing is still in its infancy, its impact on the healthcare sector will be huge. Its processing power could help the training and tuning of complex ML models, ultimately speeding up and refining the process of disease diagnosis. ML is capable of analyzing large datasets and can help to build precision medicine strategies. Predictive models draw on a panoply of information&#x2014;an individual&#x2019;s genetic fingerprint, lifestyle, and medical history&#x2014;to inform the development of personalized treatment plans.<sup><xref ref-type="bibr" rid="ref95">95</xref></sup></p>
</sec>
<sec id="sec013">
<title>Applications of LLMs in Early Disease Detection</title>
<p>The integration of large language models (LLMs) in early disease detection offers significant promise, particularly in handling unstructured healthcare data such as clinical notes, medical literature, and patient records. LLMs can process and analyze vast amounts of text data to identify patterns, correlations, and risk factors that might otherwise go unnoticed.<sup><xref ref-type="bibr" rid="ref96">96</xref></sup> By leveraging their ability to understand context and draw inferences from natural language, LLMs can assist healthcare professionals in diagnosing diseases at earlier stages by providing insights into a patient&#x2019;s medical history, symptoms, and potential risk factors. Additionally, LLMs can enhance decision support systems by synthesizing research findings and clinical guidelines, helping doctors make more informed, data-driven decisions.<sup><xref ref-type="bibr" rid="ref97">97</xref></sup></p>
<p>Furthermore, LLMs can be instrumental in analyzing and predicting trends in disease outbreaks or patient health conditions. Their ability to continuously learn from diverse datasets, including patient reports and scientific publications, enables them to track emerging patterns in disease progression or responses to treatment.<sup><xref ref-type="bibr" rid="ref98">98</xref></sup> For example, LLMs can assist in identifying early warning signs for conditions like cancer, cardiovascular diseases, or neurological disorders by analyzing subtle language cues from patient interactions and medical histories. Their adaptability allows for real-time updates on disease trends, which could lead to more timely interventions. Ultimately, the application of LLMs in early disease detection not only augments the capabilities of medical professionals but also represents a transformative shift towards more proactive, predictive, and personalized healthcare.</p>
</sec>
<sec id="sec014" sec-type="conclusions">
<title>Conclusion</title>
<p>This study underscores the significant impact of ML, EL, and DL models in early disease detection, with ML models being the most widely applied across various healthcare domains. The findings highlight the evolution of these models from simpler ML techniques to more sophisticated DL and ensemble approaches, demonstrating the increasing capacity to handle complex medical data and enhance diagnostic precision. However, challenges remain, particularly in areas such as data privacy, model interpretability, and the integration of these technologies into clinical workflows. Despite these obstacles, the study emphasizes how emerging trends and continuous advancements in AI-driven models hold the transformative potential to revolutionize early disease detection. This could lead to more proactive and personalized healthcare, ultimately improving patient outcomes, reducing healthcare costs, and advancing healthcare equity by providing better access to accurate diagnostic tools. As these technologies evolve, they will not only benefit the medical community but also have a profound societal impact by ensuring that earlier, more accurate diagnoses contribute to better overall health outcomes for individuals and communities.</p>
</sec>
</body>
<back>
<fn-group>
<fn id="n1" fn-type="other">
<p>Additional material is published online only. To view please visit the journal online.</p>
<p><bold>Cite this as</bold>: Manzoor MF. Machine Learning for Early Disease Diagnosis: A Review of Techniques in Healthcare Applications. Premier Journal of Science 2025;5:100043</p>
<p><bold>DOI</bold>: https://doi.org/10.70389/PJS.100043</p>
</fn>
<fn id="n2" fn-type="other">
<p><bold>Ethical approval</bold></p>
<p>N/a</p>
</fn>
<fn id="n3" fn-type="other">
<p><bold>Consent</bold></p>
<p>N/a</p>
</fn>
<fn id="n4" fn-type="other">
<p><bold>Funding</bold></p>
<p>No industry funding.</p>
</fn>
</fn-group>
<fn-group>
<fn id="n5" fn-type="conflict">
<p><bold>Conflicts of interest</bold></p>
<p>N/a</p>
</fn>
<fn id="n6" fn-type="other">
<p><bold>Author contribution</bold></p>
<p>Muhammad Faraz Manzoor &#x2013; Conceptualization, Writing &#x2013; original draft, review and editing</p>
</fn>
<fn id="n7" fn-type="other">
<p><bold>Guarantor</bold></p>
<p>Muhammad Faraz Manzoor</p>
</fn>
<fn id="n8" fn-type="other">
<p><bold>Provenance and peer-review</bold></p>
<p>Commissioned and externally peer-reviewed</p>
</fn>
<fn id="n9" fn-type="other">
<p><bold>Data availability statement</bold></p>
<p>N/a</p>
</fn>
</fn-group>
<ref-list>
<title>References</title>
<ref id="ref1"><label>1</label><mixed-citation publication-type="journal"><string-name><surname>Knights</surname> <given-names>D</given-names></string-name>, <string-name><surname>Parfrey</surname> <given-names>LW</given-names></string-name>, <string-name><surname>Zaneveld</surname> <given-names>J</given-names></string-name>, <string-name><surname>Lozupone</surname> <given-names>C</given-names></string-name>, <string-name><surname>Knight</surname> <given-names>R</given-names></string-name>. <article-title>Human-associated microbial signatures: examining their predictive value</article-title>. <source>Cell Host Microbe</source>. <year>2011</year>;<volume>10</volume>(<issue>4</issue>):<fpage>292</fpage>&#x2013;<lpage>6</lpage>.</mixed-citation></ref>
<ref id="ref2"><label>2</label><mixed-citation publication-type="journal"><string-name><surname>Krueger</surname> <given-names>C</given-names></string-name>, <string-name><surname>Bini</surname> <given-names>S</given-names></string-name>, <string-name><surname>Helm</surname> <given-names>JM</given-names></string-name>, <string-name><surname>Swiergosz</surname> <given-names>AM</given-names></string-name>, <string-name><surname>Haeberle</surname> <given-names>HS</given-names></string-name>, <string-name><surname>Karnuta</surname> <given-names>JM</given-names></string-name>, <etal>et al.</etal> <article-title>Machine learning and artificial intelligence: definitions, applications, and future directions</article-title>. <source>Curr Rev Musculoskelet Med</source>. <year>2020</year>;<volume>13</volume>(<issue>1</issue>):<fpage>69</fpage>&#x2013;<lpage>76</lpage>.</mixed-citation></ref>
<ref id="ref3"><label>3</label><mixed-citation publication-type="journal"><string-name><surname>Campos</surname> <given-names>TL</given-names></string-name>, <string-name><surname>Korhonen</surname> <given-names>PK</given-names></string-name>, <string-name><surname>Hofmann</surname> <given-names>A</given-names></string-name>, <string-name><surname>Gasser</surname> <given-names>RB</given-names></string-name>, <string-name><surname>Young</surname> <given-names>ND</given-names></string-name>. <article-title>Harnessing model organism genomics to underpin the machine learning-based prediction of essential genes in eukaryotes - Biotechnological implications</article-title>. <source>Biotechnol Adv</source>. <year>2022</year>;<volume>54</volume>:<fpage>107822</fpage>.</mixed-citation></ref>
<ref id="ref4"><label>4</label><mixed-citation publication-type="journal"><string-name><surname>Thrall</surname> <given-names>JH</given-names></string-name>, <string-name><surname>Li</surname> <given-names>X</given-names></string-name>, <string-name><surname>Li</surname> <given-names>Q</given-names></string-name>, <string-name><surname>Cruz</surname> <given-names>C</given-names></string-name>, <string-name><surname>Do</surname> <given-names>S</given-names></string-name>, <string-name><surname>Dreyer</surname> <given-names>K</given-names></string-name>, <etal>et al.</etal> <article-title>Artificial intelligence and machine learning in radiology: opportunities, challenges, pitfalls, and criteria for success</article-title>. <source>J Am Coll Radiol</source>. <year>2018</year>;<volume>15</volume>(<issue>3</issue>):<fpage>504</fpage>&#x2013;<lpage>8</lpage>.</mixed-citation></ref>
<ref id="ref5"><label>5</label><mixed-citation publication-type="journal"><string-name><surname>Yan</surname> <given-names>Y</given-names></string-name>, <string-name><surname>Borhani</surname> <given-names>TN</given-names></string-name>, <string-name><surname>Subraveti</surname> <given-names>SG</given-names></string-name>, <string-name><surname>Pai</surname> <given-names>KN</given-names></string-name>, <string-name><surname>Prasad</surname> <given-names>V</given-names></string-name>, <string-name><surname>Rajendran</surname> <given-names>A</given-names></string-name>, <etal>et al.</etal> <article-title>Harnessing the power of machine learning for carbon capture, utilisation, and storage (CCUS)-a state-of-the-art review</article-title>. <source>Energy Environ Sci</source>. <year>2021</year>;<volume>14</volume>(<issue>12</issue>):<fpage>6122</fpage>&#x2013;<lpage>57</lpage>.</mixed-citation></ref>
<ref id="ref6"><label>6</label><mixed-citation publication-type="journal"><string-name><surname>Ansari</surname> <given-names>AQ</given-names></string-name>, <string-name><surname>Gupta</surname> <given-names>NK</given-names></string-name>. <article-title>Automated diagnosis of coronary heart disease using neuro-fuzzy integrated system</article-title>. <source>2011 World Congress on Information and Communication Technologies, Mumbai, India</source>. <year>2011</year>. pp. <fpage>1379</fpage>&#x2013;<lpage>84</lpage>.</mixed-citation></ref>
<ref id="ref7"><label>7</label><mixed-citation publication-type="journal"><string-name><surname>Ahsan</surname> <given-names>MM</given-names></string-name>, <string-name><surname>Mahmud</surname> <given-names>MAP</given-names></string-name>, <string-name><surname>Saha</surname> <given-names>PK</given-names></string-name>, <string-name><surname>Gupta</surname> <given-names>KD</given-names></string-name>, <string-name><surname>Siddique</surname> <given-names>Z</given-names></string-name>. <article-title>Effect of data scaling methods on machine learning algorithms and model performance</article-title>. <source>Technologies</source>. <year>2021</year>;<volume>9</volume>(<issue>3</issue>):<fpage>5</fpage>&#x2013;<lpage>9</lpage>.</mixed-citation></ref>
<ref id="ref8"><label>8</label><mixed-citation publication-type="journal"><string-name><surname>Rubin</surname> <given-names>J</given-names></string-name>, <string-name><surname>Abreu</surname> <given-names>R</given-names></string-name>, <string-name><surname>Ganguli</surname> <given-names>A</given-names></string-name>, <string-name><surname>Nelaturi</surname> <given-names>S</given-names></string-name>, <string-name><surname>Matei</surname> <given-names>I</given-names></string-name>, <string-name><surname>Sricharan</surname> <given-names>K</given-names></string-name>. <article-title>Recognizing abnormal heart sounds using deep learning</article-title>. <source>CEUR Workshop Proc</source>. <year>2017</year>;<volume>1891</volume>:<fpage>13</fpage>&#x2013;<lpage>9</lpage>.</mixed-citation></ref>
<ref id="ref9"><label>9</label><mixed-citation publication-type="journal"><string-name><surname>Miao</surname> <given-names>JH</given-names></string-name>, <string-name><surname>Miao</surname> <given-names>KH</given-names></string-name>. <article-title>Cardiotocographic diagnosis of fetal health based on multiclass morphologic pattern predictions using deep learning classification</article-title>. <source>Int J Adv Comput Sci Appl</source>. <year>2018</year>;<volume>9</volume>(<issue>5</issue>):<fpage>1</fpage>&#x2013;<lpage>11</lpage>.</mixed-citation></ref>
<ref id="ref10"><label>10</label><mixed-citation publication-type="journal"><string-name><surname>Khader Basha</surname> <given-names>S</given-names></string-name>, <string-name><surname>Roja</surname> <given-names>D</given-names></string-name>, <string-name><surname>Priya</surname> <given-names>SS</given-names></string-name>, <string-name><surname>Dalavi</surname> <given-names>L</given-names></string-name>, <string-name><surname>Vellela</surname> <given-names>SS</given-names></string-name>, <string-name><surname>Venkateswara Reddy</surname> <given-names>B</given-names></string-name>. <article-title>Coronary heart disease prediction and classification using hybrid machine learning algorithms</article-title>. <source>2023 International Conference on Innovative Data Communication Technologies and Application (ICIDCA), Uttarakhand, India</source>. <year>2023</year>. pp. <fpage>7</fpage>&#x2013;<lpage>13</lpage>.</mixed-citation></ref>
<ref id="ref11"><label>11</label><mixed-citation publication-type="journal"><string-name><surname>Chandrasekhar</surname> <given-names>N</given-names></string-name>, <string-name><surname>Peddakrishna</surname> <given-names>S</given-names></string-name>. <article-title>Enhancing heart disease prediction accuracy through machine learning techniques and optimization</article-title>. <source>Processes</source>. <year>2023</year>;<volume>11</volume>(<issue>4</issue>):<fpage>1210</fpage>.</mixed-citation></ref>
<ref id="ref12"><label>12</label><mixed-citation publication-type="journal"><string-name><surname>Ahsan</surname> <given-names>MM</given-names></string-name>, <string-name><surname>Siddique</surname> <given-names>Z</given-names></string-name>. <article-title>Machine learning-based heart disease diagnosis: a systematic literature review</article-title>. <source>Artif Intell Med</source>. <year>2022</year>;<volume>128</volume>:<fpage>102289</fpage>.</mixed-citation></ref>
<ref id="ref13"><label>13</label><mixed-citation publication-type="journal"><string-name><surname>Bemando</surname> <given-names>C</given-names></string-name>, <string-name><surname>Miranda</surname> <given-names>E</given-names></string-name>, <string-name><surname>Aryuni</surname> <given-names>M</given-names></string-name>. <article-title>Machine-learning-based prediction models of coronary heart disease using Na&#x00EF;ve Bayes and random forest algorithms</article-title>. <source>2021 International Conference on Software Engineering &#x0026; Computer Systems and 4th International Conference on Computational Science and Information Management (ICSECS-ICOCSIM), Pekan, Malaysia</source>. <year>2021</year>. pp. <fpage>232</fpage>&#x2013;<lpage>7</lpage>.</mixed-citation></ref>
<ref id="ref14"><label>14</label><mixed-citation publication-type="book"><string-name><surname>Kumar</surname> <given-names>RR</given-names></string-name>, <string-name><surname>Pallavi</surname> <given-names>S</given-names></string-name>, <string-name><surname>Laxmi</surname> <given-names>KR</given-names></string-name>, <string-name><surname>Ramya</surname> <given-names>N</given-names></string-name>, <string-name><surname>Raja</surname> <given-names>R</given-names></string-name>. <chapter-title>Performance comparison of random forest classifier and convolution neural network in predicting heart diseases</chapter-title>. In: <source>Advances in Intelligent Systems and Computing</source>. <year>2020</year> (Vol. <volume>1090</volume>, pp. <fpage>821</fpage>&#x2013;<lpage>28</lpage>). <publisher-name>Springer</publisher-name>.</mixed-citation></ref>
<ref id="ref15"><label>15</label><mixed-citation publication-type="journal"><string-name><surname>Singh</surname> <given-names>H</given-names></string-name>, <string-name><surname>Navaneeth</surname> <given-names>NV</given-names></string-name>, <string-name><surname>Pillai</surname> <given-names>GN</given-names></string-name>. <article-title>Multisurface proximal SVM based decision trees for heart disease classification</article-title>. In: <source>IEEE Region 10 Annual International Conference, Proceedings/TENCON. IEEE</source>; <year>2019</year>. pp. <fpage>13</fpage>&#x2013;<lpage>8</lpage>.</mixed-citation></ref>
<ref id="ref16"><label>16</label><mixed-citation publication-type="journal"><string-name><surname>Desai</surname> <given-names>SD</given-names></string-name>, <string-name><surname>Giraddi</surname> <given-names>S</given-names></string-name>, <string-name><surname>Narayankar</surname> <given-names>P</given-names></string-name>, <string-name><surname>Pudakalakatti</surname> <given-names>NR</given-names></string-name>, <string-name><surname>Sulegaon</surname> <given-names>S</given-names></string-name>. <article-title>Back-propagation neural network versus logistic regression in heart disease classification</article-title>. <source>Adv Intell Syst Comput</source>. <year>2019</year>;<volume>702</volume>:<fpage>133</fpage>&#x2013;<lpage>44</lpage>.</mixed-citation></ref>
<ref id="ref17"><label>17</label><mixed-citation publication-type="journal"><string-name><surname>Patil</surname> <given-names>DD</given-names></string-name>, <string-name><surname>Singh</surname> <given-names>RP</given-names></string-name>, <string-name><surname>Thakare</surname> <given-names>VM</given-names></string-name>, <string-name><surname>Gulve</surname> <given-names>AK</given-names></string-name>. <article-title>Analysis of ECG arrhythmia for heart disease detection using SVM and Cuckoo search optimized neural network</article-title>. <source>Int J Eng Technol</source>. <year>2018</year>;<volume>7</volume>(<issue>2</issue>):<fpage>27</fpage>&#x2013;<lpage>33</lpage>.</mixed-citation></ref>
<ref id="ref18"><label>18</label><mixed-citation publication-type="journal"><string-name><surname>Acharya</surname> <given-names>UR</given-names></string-name>, <string-name><surname>Oh</surname> <given-names>SL</given-names></string-name>, <string-name><surname>Hagiwara</surname> <given-names>Y</given-names></string-name>, <string-name><surname>Tan</surname> <given-names>JH</given-names></string-name>, <string-name><surname>Adam</surname> <given-names>M</given-names></string-name>, <string-name><surname>Gertych</surname> <given-names>A</given-names></string-name>, <etal>et al.</etal> <article-title>A deep convolutional neural network model to classify heartbeats</article-title>. <source>Comput Biol Med</source>. <year>2017</year>;<volume>89</volume>:<fpage>389</fpage>&#x2013;<lpage>96</lpage>.</mixed-citation></ref>
<ref id="ref19"><label>19</label><mixed-citation publication-type="journal"><string-name><surname>Yang</surname> <given-names>W</given-names></string-name>, <string-name><surname>Si</surname> <given-names>Y</given-names></string-name>, <string-name><surname>Wang</surname> <given-names>D</given-names></string-name>, <string-name><surname>Guo</surname> <given-names>B</given-names></string-name>. <article-title>Automatic recognition of arrhythmia based on principal component analysis network and linear support vector machine</article-title>. <source>Comput Biol Med</source>. <year>2018</year>;<volume>101</volume>:<fpage>22</fpage>&#x2013;<lpage>32</lpage>.</mixed-citation></ref>
<ref id="ref20"><label>20</label><mixed-citation publication-type="journal"><string-name><surname>Levey</surname> <given-names>AS</given-names></string-name>, <string-name><surname>Coresh</surname> <given-names>J</given-names></string-name>. <article-title>Chronic kidney disease</article-title>. <source>Lancet</source>. <year>2012</year>;<volume>379</volume>(<issue>9811</issue>):<fpage>165</fpage>&#x2013;<lpage>80</lpage>.</mixed-citation></ref>
<ref id="ref21"><label>21</label><mixed-citation publication-type="journal"><string-name><surname>Charleonnan</surname> <given-names>A</given-names></string-name>, <string-name><surname>Fufaung</surname> <given-names>T</given-names></string-name>, <string-name><surname>Niyomwong</surname> <given-names>T</given-names></string-name>, <string-name><surname>Chokchueypattanakit</surname> <given-names>W</given-names></string-name>, <string-name><surname>Suwannawach</surname> <given-names>S</given-names></string-name>, <string-name><surname>Ninchawee</surname> <given-names>N</given-names></string-name>. <article-title>Predictive analytics for chronic kidney disease using machine learning techniques</article-title>. <source>2016 Management and Innovation Technology International Conference (MITicon), Bang-San, Thailand</source>. <year>2016</year>. pp. <fpage>MIT-80</fpage>&#x2013;<lpage>MIT-83</lpage>.</mixed-citation></ref>
<ref id="ref22"><label>22</label><mixed-citation publication-type="journal"><string-name><surname>Aljaaf</surname> <given-names>AJ</given-names></string-name>, <string-name><surname>Al-Jumeily</surname> <given-names>D</given-names></string-name>, <string-name><surname>Haglan</surname> <given-names>HM</given-names></string-name>, <string-name><surname>Alloghani</surname> <given-names>M</given-names></string-name>, <string-name><surname>Baker</surname> <given-names>T</given-names></string-name>, <string-name><surname>Hussain</surname> <given-names>AJ</given-names></string-name>, <etal>et al.</etal> <article-title>Early prediction of chronic kidney disease using machine learning supported by predictive analytics</article-title>. <source>2018 IEEE Congress on Evolutionary Computation (CEC), Rio de Janeiro, Brazil</source>. <year>2018</year>. pp. <fpage>1</fpage>&#x2013;<lpage>9</lpage>.</mixed-citation></ref>
<ref id="ref23"><label>23</label><mixed-citation publication-type="journal"><string-name><surname>Ma</surname> <given-names>F</given-names></string-name>, <string-name><surname>Sun</surname> <given-names>T</given-names></string-name>, <string-name><surname>Liu</surname> <given-names>L</given-names></string-name>, <string-name><surname>Jing</surname> <given-names>H</given-names></string-name>. <article-title>Detection and diagnosis of chronic kidney disease using deep learning-based heterogeneous modified artificial neural network</article-title>. <source>Futur Gener Comput Syst</source>. <year>2020</year>;<volume>111</volume>:<fpage>17</fpage>&#x2013;<lpage>26</lpage>.</mixed-citation></ref>
<ref id="ref24"><label>24</label><mixed-citation publication-type="journal"><string-name><surname>Islam</surname> <given-names>MA</given-names></string-name>, <string-name><surname>Majumder</surname> <given-names>MZH</given-names></string-name>, <string-name><surname>Hussein</surname> <given-names>MA</given-names></string-name>. <article-title>Chronic kidney disease prediction based on machine learning algorithms</article-title>. <source>J Pathol Inform</source>. <year>2023</year>;<volume>14</volume>:<fpage>100189</fpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.jpi.2023.100189">https://doi.org/10.1016/j.jpi.2023.100189</ext-link></mixed-citation></ref>
<ref id="ref25"><label>25</label><mixed-citation publication-type="journal"><string-name><surname>Sawhney</surname> <given-names>R</given-names></string-name>, <string-name><surname>Malik</surname> <given-names>A</given-names></string-name>, <string-name><surname>Sharma</surname> <given-names>S</given-names></string-name>, <string-name><surname>Narayan</surname> <given-names>V</given-names></string-name>. <article-title>A comparative assessment of artificial intelligence models used for early prediction and evaluation of chronic kidney disease</article-title>. <source>Decis Anal J</source>. <year>2023</year>;<volume>6</volume>:<fpage>100169</fpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.dajour.2023.100169">https://doi.org/10.1016/j.dajour.2023.100169</ext-link></mixed-citation></ref>
<ref id="ref26"><label>26</label><mixed-citation publication-type="book"><string-name><surname>Sahani</surname> <given-names>A</given-names></string-name>, <string-name><surname>Arya</surname> <given-names>J</given-names></string-name>, <string-name><surname>Patro</surname> <given-names>A</given-names></string-name>, <string-name><surname>Priyadarshini</surname> <given-names>SBB</given-names></string-name>. <chapter-title>Effective use of Na&#x00EF;ve Bayes, decision tree, and random forest techniques for analysis of chronic kidney disease</chapter-title>. In: <source>Smart Innovation, Systems and Technologies</source>. <year>2021</year> (Vol. <volume>194</volume>, pp. <fpage>813</fpage>&#x2013;<lpage>818</lpage>). <publisher-name>Springer</publisher-name>.</mixed-citation></ref>
<ref id="ref27"><label>27</label><mixed-citation publication-type="journal"><string-name><surname>Nithya</surname> <given-names>A</given-names></string-name>, <string-name><surname>Appathurai</surname> <given-names>A</given-names></string-name>, <string-name><surname>Venkatadri</surname> <given-names>N</given-names></string-name>, <string-name><surname>Ramji</surname> <given-names>DR</given-names></string-name>, <string-name><surname>Anna Palagan</surname> <given-names>C</given-names></string-name>. <article-title>Kidney disease detection and segmentation using artificial neural network and multi-kernel k-means clustering for ultrasound images</article-title>. <source>Meas J Int Meas Confed</source>. <year>2020</year>;<volume>149</volume>:<fpage>106952</fpage>.</mixed-citation></ref>
<ref id="ref28"><label>28</label><mixed-citation publication-type="journal"><string-name><surname>Imran</surname> <given-names>AA</given-names></string-name>, <string-name><surname>Amin</surname> <given-names>MN</given-names></string-name>, <string-name><surname>Johora</surname> <given-names>FT</given-names></string-name>. <article-title>Classification of chronic kidney disease using logistic regression, feedforward neural network and wide &#x0026; deep learning</article-title>. <source>2018 International Conference on Innovation in Engineering and Technology (ICIET), Dhaka, Bangladesh</source>. <year>2018</year>. pp. <fpage>1</fpage>&#x2013;<lpage>6</lpage>.</mixed-citation></ref>
<ref id="ref29"><label>29</label><mixed-citation publication-type="journal"><string-name><surname>Navaneeth</surname> <given-names>B</given-names></string-name>, <string-name><surname>Suchetha</surname> <given-names>M</given-names></string-name>. <article-title>A dynamic pooling based convolutional neural network approach to detect chronic kidney disease</article-title>. <source>Biomed Signal Process Control</source>. <year>2020</year>;<volume>62</volume>:<fpage>102068</fpage>.</mixed-citation></ref>
<ref id="ref30"><label>30</label><mixed-citation publication-type="journal"><string-name><surname>Brunetti</surname> <given-names>A</given-names></string-name>, <string-name><surname>Cascarano</surname> <given-names>GD</given-names></string-name>, <string-name><surname>Bevilacqua</surname> <given-names>V</given-names></string-name>. <article-title>Detection and Segmentation of Kidneys from Magnetic Resonance Images in Patients with Autosomal Dominant Polycystic Kidney Disease</article-title>. <source>Springer</source>. <year>2019</year>. pp. <fpage>639</fpage>&#x2013;<lpage>50</lpage>.</mixed-citation></ref>
<ref id="ref31"><label>31</label><mixed-citation publication-type="journal"><string-name><surname>Miranda</surname> <given-names>GHB</given-names></string-name>, <string-name><surname>Felipe</surname> <given-names>JC</given-names></string-name>. <article-title>Computer-aided diagnosis system based on fuzzy logic for breast cancer categorization</article-title>. <source>Comput Biol Med</source>. <year>2015</year>;<volume>64</volume>:<fpage>334</fpage>&#x2013;<lpage>46</lpage>.</mixed-citation></ref>
<ref id="ref32"><label>32</label><mixed-citation publication-type="journal"><string-name><surname>Zheng</surname> <given-names>B</given-names></string-name>, <string-name><surname>Yoon</surname> <given-names>SW</given-names></string-name>, <string-name><surname>Lam</surname> <given-names>SS</given-names></string-name>. <article-title>Breast cancer diagnosis based on feature extraction using a hybrid of K-means and support vector machine algorithms</article-title>. <source>Expert Syst Appl</source>. <year>2014</year>;<volume>41</volume>(<issue>4 PART 1</issue>):<fpage>1476</fpage>&#x2013;<lpage>82</lpage>.</mixed-citation></ref>
<ref id="ref33"><label>33</label><mixed-citation publication-type="journal"><string-name><surname>Asri</surname> <given-names>H</given-names></string-name>, <string-name><surname>Mousannif</surname> <given-names>H</given-names></string-name>, <string-name><surname>Al Moatassime</surname> <given-names>H</given-names></string-name>, <string-name><surname>Noel</surname> <given-names>T</given-names></string-name>. <article-title>Using machine learning algorithms for breast cancer risk prediction and diagnosis</article-title>. <source>Procedia Comput Sci</source>. <year>2016</year>;<volume>83</volume>:<fpage>1064</fpage>&#x2013;<lpage>9</lpage>.</mixed-citation></ref>
<ref id="ref34"><label>34</label><mixed-citation publication-type="book"><string-name><surname>Mohammed</surname> <given-names>SA</given-names></string-name>, <string-name><surname>Darrab</surname> <given-names>S</given-names></string-name>, <string-name><surname>Noaman</surname> <given-names>SA</given-names></string-name>, <string-name><surname>Saake</surname> <given-names>G</given-names></string-name>. <chapter-title>Analysis of breast cancer detection using different machine learning techniques</chapter-title>. In: <source>CCIS, Communications in Computer and Information Science</source>. <year>2020</year> (Vol. <volume>1234</volume>, pp. <fpage>108</fpage>&#x2013;<lpage>117</lpage>). <publisher-name>Springer</publisher-name>.</mixed-citation></ref>
<ref id="ref35"><label>35</label><mixed-citation publication-type="journal"><string-name><surname>Assegie</surname> <given-names>TA</given-names></string-name>. <article-title>An optimized K-Nearest neighbor based breast cancer detection</article-title>. <source>J Robot Control</source>. <year>2021</year>;<volume>2</volume>(<issue>3</issue>):<fpage>115</fpage>&#x2013;<lpage>8</lpage>.</mixed-citation></ref>
<ref id="ref36"><label>36</label><mixed-citation publication-type="journal"><string-name><surname>Bhattacherjee</surname> <given-names>A</given-names></string-name>, <string-name><surname>Roy</surname> <given-names>S</given-names></string-name>, <string-name><surname>Paul</surname> <given-names>S</given-names></string-name>, <string-name><surname>Roy</surname> <given-names>P</given-names></string-name>, <string-name><surname>Kausar</surname> <given-names>N</given-names></string-name>, <string-name><surname>Dey</surname> <given-names>N</given-names></string-name>. <article-title>Classification approach for breast cancer detection using back propagation neural network</article-title>. <source>Deep Learn Neural Networks</source>. <year>2019</year>;<fpage>1410</fpage>&#x2013;<lpage>21</lpage>.</mixed-citation></ref>
<ref id="ref37"><label>37</label><mixed-citation publication-type="journal"><string-name><surname>Alshayeji</surname> <given-names>MH</given-names></string-name>, <string-name><surname>Ellethy</surname> <given-names>H</given-names></string-name>, <string-name><surname>Abed</surname> <given-names>S</given-names></string-name>, <string-name><surname>Gupta</surname> <given-names>R</given-names></string-name>. <article-title>Computer-aided detection of breast cancer on the Wisconsin dataset: an artificial neural networks approach</article-title>. <source>Biomed Signal Process Control</source>. <year>2022</year>;<volume>71</volume>:<fpage>103141</fpage>.</mixed-citation></ref>
<ref id="ref38"><label>38</label><mixed-citation publication-type="journal"><string-name><surname>Sultana</surname> <given-names>Z</given-names></string-name>, <string-name><surname>Rahman Khan</surname> <given-names>MA</given-names></string-name>, <string-name><surname>Jahan</surname> <given-names>N</given-names></string-name>. <article-title>Early breast cancer detection utilizing artificial neural network</article-title>. <source>Wseas Trans Biol Biomed</source>. <year>2021</year>;<volume>18</volume>:<fpage>32</fpage>&#x2013;<lpage>42</lpage>.</mixed-citation></ref>
<ref id="ref39"><label>39</label><mixed-citation publication-type="journal"><string-name><surname>Ghosh</surname> <given-names>P</given-names></string-name>, <string-name><surname>Azam</surname> <given-names>S</given-names></string-name>, <string-name><surname>Hasib</surname> <given-names>KM</given-names></string-name>, <string-name><surname>Karim</surname> <given-names>A</given-names></string-name>, <string-name><surname>Jonkman</surname> <given-names>M</given-names></string-name>, <string-name><surname>Anwar</surname> <given-names>A</given-names></string-name>. <article-title>A performance based study on deep learning algorithms in the effective prediction of breast cancer</article-title>. <source>2021 International Joint Conference on Neural Networks (IJCNN), Shenzhen, China</source>. <year>2021</year>. pp. <fpage>1</fpage>&#x2013;<lpage>8</lpage>.</mixed-citation></ref>
<ref id="ref40"><label>40</label><mixed-citation publication-type="journal"><string-name><surname>Das</surname> <given-names>AK</given-names></string-name>, <string-name><surname>Biswas</surname> <given-names>SK</given-names></string-name>, <string-name><surname>Mandal</surname> <given-names>A</given-names></string-name>, <string-name><surname>Bhattacharya</surname> <given-names>A</given-names></string-name>, <string-name><surname>Sanyal</surname> <given-names>S</given-names></string-name>. <article-title>Machine learning based intelligent system for breast cancer prediction (MLISBCP)</article-title>. <source>Expert Syst Appl</source>. <year>2024</year>;<volume>242</volume>:<fpage>122673</fpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.eswa.2023.122673">https://doi.org/10.1016/j.eswa.2023.122673</ext-link></mixed-citation></ref>
<ref id="ref41"><label>41</label><mixed-citation publication-type="journal"><string-name><surname>Shafique</surname> <given-names>R</given-names></string-name>, <string-name><surname>Rustam</surname> <given-names>F</given-names></string-name>, <string-name><surname>Choi</surname> <given-names>GS</given-names></string-name>, <string-name><surname>de la Torre D&#x00ED;ez</surname> <given-names>I</given-names></string-name>, <string-name><surname>Mahmood</surname> <given-names>A</given-names></string-name>, <string-name><surname>Lipari</surname> <given-names>V</given-names></string-name>, <etal>et al.</etal> <article-title>Breast cancer prediction using fine needle aspiration features and upsampling with supervised machine learning</article-title>. <source>Cancers (Basel)</source>. <year>2023</year>;<volume>15</volume>(<issue>3</issue>):<fpage>1</fpage>&#x2013;<lpage>21</lpage>.</mixed-citation></ref>
<ref id="ref42"><label>42</label><mixed-citation publication-type="journal"><string-name><surname>Rajendran</surname> <given-names>K</given-names></string-name>, <string-name><surname>Jayabalan</surname> <given-names>M</given-names></string-name>, <string-name><surname>Thiruchelvam</surname> <given-names>V</given-names></string-name>. <article-title>Predicting breast cancer via supervised machine learning methods on class imbalanced data</article-title>. <source>Int J Adv Comput Sci Appl</source>. <year>2020</year>;<volume>11</volume>(<issue>8</issue>):<fpage>54</fpage>&#x2013;<lpage>63</lpage>.</mixed-citation></ref>
<ref id="ref43"><label>43</label><mixed-citation publication-type="journal"><string-name><surname>Abdel-Nasser</surname> <given-names>M</given-names></string-name>, <string-name><surname>Rashwan</surname> <given-names>HA</given-names></string-name>, <string-name><surname>Puig</surname> <given-names>D</given-names></string-name>, <string-name><surname>Moreno</surname> <given-names>A</given-names></string-name>. <article-title>Analysis of tissue abnormality and breast density in mammographic images using a uniform local directional pattern</article-title>. <source>Expert Syst Appl</source>. <year>2015</year>;<volume>42</volume>(<issue>24</issue>):<fpage>9499</fpage>&#x2013;<lpage>511</lpage>.</mixed-citation></ref>
<ref id="ref44"><label>44</label><mixed-citation publication-type="journal"><string-name><surname>Sharma</surname> <given-names>S</given-names></string-name>, <string-name><surname>Khanna</surname> <given-names>P</given-names></string-name>. <article-title>Computer-aided diagnosis of malignant mammograms using Zernike moments and SVM</article-title>. <source>J Digit Imaging</source>. <year>2015</year>;<volume>28</volume>(<issue>1</issue>):<fpage>77</fpage>&#x2013;<lpage>90</lpage>.</mixed-citation></ref>
<ref id="ref45"><label>45</label><mixed-citation publication-type="journal"><string-name><surname>Moon</surname> <given-names>WK</given-names></string-name>, <string-name><surname>Chen</surname> <given-names>IL</given-names></string-name>, <string-name><surname>Chang</surname> <given-names>JM</given-names></string-name>, <string-name><surname>Shin</surname> <given-names>SU</given-names></string-name>, <string-name><surname>Lo</surname> <given-names>CM</given-names></string-name>, <string-name><surname>Chang</surname> <given-names>RF</given-names></string-name>. <article-title>The adaptive computer-aided diagnosis system based on tumor sizes for the classification of breast tumors detected at screening ultrasound</article-title>. <source>Ultrasonics</source>. <year>2017</year>;<volume>76</volume>:<fpage>70</fpage>&#x2013;<lpage>7</lpage>.</mixed-citation></ref>
<ref id="ref46"><label>46</label><mixed-citation publication-type="journal"><string-name><surname>Lo</surname> <given-names>CM</given-names></string-name>, <string-name><surname>Chan</surname> <given-names>SW</given-names></string-name>, <string-name><surname>Yang</surname> <given-names>YW</given-names></string-name>, <string-name><surname>Chang</surname> <given-names>YC</given-names></string-name>, <string-name><surname>Huang</surname> <given-names>CS</given-names></string-name>, <string-name><surname>Jou</surname> <given-names>YS</given-names></string-name>, <etal>et al.</etal> <article-title>Feasibility testing: three-dimensional tumor mapping in different orientations of automated breast ultrasound</article-title>. <source>Ultrasound Med Biol</source>. <year>2016</year>;<volume>42</volume>(<issue>5</issue>):<fpage>1201</fpage>&#x2013;<lpage>10</lpage>.</mixed-citation></ref>
<ref id="ref47"><label>47</label><mixed-citation publication-type="journal"><string-name><surname>Venkatesh</surname> <given-names>SS</given-names></string-name>, <string-name><surname>Levenback</surname> <given-names>BJ</given-names></string-name>, <string-name><surname>Sultan</surname> <given-names>LR</given-names></string-name>, <string-name><surname>Bouzghar</surname> <given-names>G</given-names></string-name>, <string-name><surname>Sehgal</surname> <given-names>CM</given-names></string-name>. <article-title>Going beyond a first reader: a machine learning methodology for optimizing cost and performance in breast ultrasound diagnosis</article-title>. <source>Ultrasound Med Biol</source>. <year>2015</year>;<volume>41</volume>(<issue>12</issue>):<fpage>3148</fpage>&#x2013;<lpage>62</lpage>.</mixed-citation></ref>
<ref id="ref48"><label>48</label><mixed-citation publication-type="journal"><string-name><surname>Naz</surname> <given-names>H</given-names></string-name>, <string-name><surname>Ahuja</surname> <given-names>S</given-names></string-name>. <article-title>Deep learning approach for diabetes prediction using PIMA Indian dataset</article-title>. <source>J Diabetes Metab Disord</source>. <year>2020</year>;<volume>19</volume>(<issue>1</issue>):<fpage>391</fpage>&#x2013;<lpage>403</lpage>.</mixed-citation></ref>
<ref id="ref49"><label>49</label><mixed-citation publication-type="journal"><string-name><surname>Kandhasamy</surname> <given-names>JP</given-names></string-name>, <string-name><surname>Balamurali</surname> <given-names>S</given-names></string-name>. <article-title>Performance analysis of classifier models to predict diabetes mellitus</article-title>. <source>Procedia Comput Sci</source>. <year>2015</year>;<volume>47</volume>(<issue>C</issue>):<fpage>45</fpage>&#x2013;<lpage>51</lpage>.</mixed-citation></ref>
<ref id="ref50"><label>50</label><mixed-citation publication-type="journal"><string-name><surname>Yahyaoui</surname> <given-names>A</given-names></string-name>, <string-name><surname>Jamil</surname> <given-names>A</given-names></string-name>, <string-name><surname>Rasheed</surname> <given-names>J</given-names></string-name>, <string-name><surname>Yesiltepe</surname> <given-names>M</given-names></string-name>. <article-title>A decision support system for diabetes prediction using machine learning and deep learning techniques</article-title>. <source>2019 1st International Informatics and Software Engineering Conference (UBMYK), Ankara, Turkey</source>. <year>2019</year>. pp. <fpage>1</fpage>&#x2013;<lpage>4</lpage>.</mixed-citation></ref>
<ref id="ref51"><label>51</label><mixed-citation publication-type="journal"><string-name><surname>Ashiquzzaman</surname> <given-names>A</given-names></string-name>, <string-name><surname>Tushar</surname> <given-names>AK</given-names></string-name>, <string-name><surname>Islam</surname> <given-names>MR</given-names></string-name>, <string-name><surname>Shon</surname> <given-names>D</given-names></string-name>, <string-name><surname>Im</surname> <given-names>K</given-names></string-name>, <string-name><surname>Park</surname> <given-names>JH</given-names></string-name>, <etal>et al.</etal> <article-title>Reduction of overfitting in diabetes prediction using deep learning neural network</article-title>. <source>Lect Notes Electr Eng</source>. <year>2017</year>;<volume>449</volume>:<fpage>35</fpage>&#x2013;<lpage>43</lpage>.</mixed-citation></ref>
<ref id="ref52"><label>52</label><mixed-citation publication-type="book"><string-name><surname>Alhassan</surname> <given-names>Z</given-names></string-name>, <string-name><surname>McGough</surname> <given-names>AS</given-names></string-name>, <string-name><surname>Alshammari</surname> <given-names>R</given-names></string-name>, <string-name><surname>Daghstani</surname> <given-names>T</given-names></string-name>, <string-name><surname>Budgen</surname> <given-names>D</given-names></string-name>, <string-name><surname>Al Moubayed</surname> <given-names>N</given-names></string-name>. <chapter-title>Type-2 diabetes mellitus diagnosis from time series clinical data using deep learning models</chapter-title>. In <string-name><surname>K&#x016F;rkov&#x00E1;</surname> <given-names>V</given-names></string-name>, <string-name><surname>Manolopoulos</surname> <given-names>Y</given-names></string-name>, <string-name><surname>Hammer</surname> <given-names>B</given-names></string-name>, <string-name><surname>Iliadis</surname> <given-names>L</given-names></string-name>, <string-name><surname>Maglogiannis</surname> <given-names>I</given-names></string-name>, eds. <source>Artificial Neural Networks and Machine Learning - ICANN 2018. ICANN 2018. Lecture Notes in Computer Science</source> <year>2018</year>;(Vol. <volume>11141</volume>, pp. <fpage>468</fpage>&#x2013;<lpage>78</lpage>). <publisher-name>Springer</publisher-name>.</mixed-citation></ref>
<ref id="ref53"><label>53</label><mixed-citation publication-type="journal"><string-name><surname>Febrian</surname> <given-names>ME</given-names></string-name>, <string-name><surname>Ferdinan</surname> <given-names>FX</given-names></string-name>, <string-name><surname>Sendani</surname> <given-names>GP</given-names></string-name>, <string-name><surname>Suryanigrum</surname> <given-names>KM</given-names></string-name>, <string-name><surname>Yunanda</surname> <given-names>R</given-names></string-name>. <article-title>Diabetes prediction using supervised machine learning</article-title>. <source>Procedia Comput Sci</source>. <year>2022</year>;<volume>216</volume>(<issue>2022</issue>):<fpage>21</fpage>&#x2013;<lpage>30</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.procs.2022.12.107">https://doi.org/10.1016/j.procs.2022.12.107</ext-link></mixed-citation></ref>
<ref id="ref54"><label>54</label><mixed-citation publication-type="journal"><string-name><surname>Modak</surname> <given-names>SKS</given-names></string-name>, <string-name><surname>Jha</surname> <given-names>VK</given-names></string-name>. <article-title>Diabetes prediction model using machine learning techniques</article-title>. <source>Multimed Tools Appl</source>. <year>2024</year>;<volume>83</volume>(<issue>13</issue>):<fpage>38523</fpage>&#x2013;<lpage>49</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1007/s11042-023-16745-4">https://doi.org/10.1007/s11042-023-16745-4</ext-link></mixed-citation></ref>
<ref id="ref55"><label>55</label><mixed-citation publication-type="journal"><string-name><surname>Fitriyani</surname> <given-names>NL</given-names></string-name>, <string-name><surname>Syafrudin</surname> <given-names>M</given-names></string-name>, <string-name><surname>Alfian</surname> <given-names>G</given-names></string-name>, <string-name><surname>Rhee</surname> <given-names>J</given-names></string-name>. <article-title>Development of disease prediction model based on ensemble learning approach for diabetes and hypertension</article-title>. <source>IEEE Access</source>. <year>2019</year>;<volume>7</volume>:<fpage>144777</fpage>&#x2013;<lpage>89</lpage>.</mixed-citation></ref>
<ref id="ref56"><label>56</label><mixed-citation publication-type="journal"><string-name><surname>Fern&#x00E1;ndez-Edreira</surname> <given-names>D</given-names></string-name>, <string-name><surname>Li&#x00F1;ares-Blanco</surname> <given-names>J</given-names></string-name>, <string-name><surname>Fernandez-Lozano</surname> <given-names>C</given-names></string-name>. <article-title>Machine learning analysis of the human infant gut microbiome identifies influential species in type 1 diabetes</article-title>. <source>Expert Syst Appl</source>. <year>2021</year>;<volume>185</volume>:<fpage>115648</fpage>.</mixed-citation></ref>
<ref id="ref57"><label>57</label><mixed-citation publication-type="journal"><string-name><surname>Ali</surname> <given-names>A</given-names></string-name>, <string-name><surname>Alrubei</surname> <given-names>M</given-names></string-name>, <string-name><surname>Hassan</surname> <given-names>LFM</given-names></string-name>, <string-name><surname>Al-Ja&#x2019;afari</surname> <given-names>M</given-names></string-name>, <string-name><surname>Abdulwahed</surname> <given-names>S</given-names></string-name>. <article-title>Diabetes diagnosis based on KNN</article-title>. <source>IIUM Eng J</source>. <year>2020</year>;<volume>21</volume>(<issue>1</issue>):<fpage>175</fpage>&#x2013;<lpage>81</lpage>.</mixed-citation></ref>
<ref id="ref58"><label>58</label><mixed-citation publication-type="journal"><string-name><surname>Tsao</surname> <given-names>HY</given-names></string-name>, <string-name><surname>Chan</surname> <given-names>PY</given-names></string-name>, <string-name><surname>Su</surname> <given-names>ECY</given-names></string-name>. <article-title>Predicting diabetic retinopathy and identifying interpretable biomedical features using machine learning algorithms</article-title>. <source>BMC Bioinformatics</source>. <year>2018</year>;<volume>19</volume>:<fpage>283</fpage>.</mixed-citation></ref>
<ref id="ref59"><label>59</label><mixed-citation publication-type="journal"><string-name><surname>Qteat</surname> <given-names>H</given-names></string-name>, <string-name><surname>Awad</surname> <given-names>M</given-names></string-name>. <article-title>Using hybrid model of particle swarm optimization and multi-layer perceptron neural networks for classification of diabetes</article-title>. <source>Int J Intell Eng Syst</source>. <year>2021</year>;<volume>14</volume>:<fpage>10</fpage>&#x2013;<lpage>22</lpage>.</mixed-citation></ref>
<ref id="ref60"><label>60</label><mixed-citation publication-type="journal"><string-name><surname>Ahsan</surname> <given-names>MM</given-names></string-name>, <string-name><surname>Nazim</surname> <given-names>R</given-names></string-name>, <string-name><surname>Siddique</surname> <given-names>Z</given-names></string-name>, <string-name><surname>Huebner</surname> <given-names>P</given-names></string-name>. <article-title>Detection of COVID-19 patients from CT scan and chest X-ray data using modified MobileNetV2 and LIME</article-title>. <source>Healthc</source>. <year>2021</year>;<volume>9</volume>(<issue>9</issue>):<fpage>1</fpage>&#x2013;<lpage>12</lpage>.</mixed-citation></ref>
<ref id="ref61"><label>61</label><mixed-citation publication-type="journal"><string-name><surname>Haghanifar</surname> <given-names>A</given-names></string-name>, <string-name><surname>Majdabadi</surname> <given-names>MM</given-names></string-name>, <string-name><surname>Choi</surname> <given-names>Y</given-names></string-name>, <string-name><surname>Deivalakshmi</surname> <given-names>S</given-names></string-name>, <string-name><surname>Ko</surname> <given-names>S</given-names></string-name>. <article-title>COVID-CXNet: Detecting COVID-19 in frontal chest X-ray images using deep learning</article-title>. <source>Multimed Tools Appl</source>. <year>2022</year>;<volume>81</volume>:<fpage>30615</fpage>&#x2013;<lpage>645</lpage>.</mixed-citation></ref>
<ref id="ref62"><label>62</label><mixed-citation publication-type="journal"><string-name><surname>Chen</surname> <given-names>J</given-names></string-name>, <string-name><surname>Wu</surname> <given-names>L</given-names></string-name>, <string-name><surname>Zhang</surname> <given-names>J</given-names></string-name>, <string-name><surname>Zhang</surname> <given-names>L</given-names></string-name>, <string-name><surname>Gong</surname> <given-names>D</given-names></string-name>, <string-name><surname>Zhao</surname> <given-names>Y</given-names></string-name>, <etal>et al.</etal> <article-title>Deep learning-based model for detecting 2019 novel coronavirus pneumonia on high-resolution computed tomography</article-title>. <source>Sci Rep</source>. <year>2020</year>;<volume>10</volume>(<issue>1</issue>):<fpage>1</fpage>&#x2013;<lpage>11</lpage>.</mixed-citation></ref>
<ref id="ref63"><label>63</label><mixed-citation publication-type="journal"><string-name><surname>Abbasian</surname> <given-names>A</given-names></string-name>, <string-name><surname>Rajabzadeh</surname> <given-names>A</given-names></string-name>, <string-name><surname>Acharya</surname> <given-names>UR</given-names></string-name>. <article-title>Application of deep learning technique to manage COVID-19 in routine clinical practice using CT images: Results of 10 convolutional neural networks</article-title>. <source>Comput Biol Med</source>. <year>2020</year>;<volume>121</volume>:<fpage>103795</fpage>.</mixed-citation></ref>
<ref id="ref64"><label>64</label><mixed-citation publication-type="journal"><string-name><surname>Wang</surname> <given-names>L</given-names></string-name>, <string-name><surname>Lin</surname> <given-names>ZQ</given-names></string-name>, <string-name><surname>Wong</surname> <given-names>A</given-names></string-name>. <article-title>COVID-Net: a tailored deep convolutional neural network design for detection of COVID-19 cases from chest X-ray images</article-title>. <source>Sci Rep</source>. <year>2020</year>;<volume>10</volume>(<issue>1</issue>):<fpage>1</fpage>&#x2013;<lpage>12</lpage>.</mixed-citation></ref>
<ref id="ref65"><label>65</label><mixed-citation publication-type="journal"><string-name><surname>Lin</surname> <given-names>L</given-names></string-name>, <string-name><surname>Hou</surname> <given-names>H</given-names></string-name>, <string-name><surname>Lv</surname> <given-names>W</given-names></string-name>, <string-name><surname>Tao</surname> <given-names>Q</given-names></string-name>, <string-name><surname>Hospital</surname> <given-names>T</given-names></string-name>, <string-name><surname>Company</surname> <given-names>JT</given-names></string-name>, <etal>et al.</etal> <article-title>Artificial intelligence distinguishes COVID-19 from community acquired pneumonia on chest CT</article-title>. <source>Appl Intell</source>. <year>2020</year>;<volume>2019</volume>:<fpage>1</fpage>&#x2013;<lpage>5</lpage>.</mixed-citation></ref>
<ref id="ref66"><label>66</label><mixed-citation publication-type="journal"><string-name><surname>Lababidi</surname> <given-names>S</given-names></string-name>. <article-title>Covidx-net: A framework of deep learning classifiers to diagnose COVID-19 in X-ray images</article-title>. <source>Sustain Mach Intell J</source>. <year>2024</year>;<volume>6</volume>:<fpage>11055</fpage>.</mixed-citation></ref>
<ref id="ref67"><label>67</label><mixed-citation publication-type="journal"><string-name><surname>Khoudour</surname> <given-names>ME</given-names></string-name>, <string-name><surname>Biskri</surname> <given-names>I</given-names></string-name>. <article-title>Detection of coronavirus disease (COVID-19) based on deep features and support vector machine</article-title>. <source>2023 International Conference on Machine Learning and Applications (ICMLA), Jacksonville, FL, USA</source>. <year>2023</year>. p. <fpage>1332</fpage>&#x2013;<lpage>7</lpage>.</mixed-citation></ref>
<ref id="ref68"><label>68</label><mixed-citation publication-type="journal"><string-name><surname>Narin</surname> <given-names>A</given-names></string-name>, <string-name><surname>Kaya</surname> <given-names>C</given-names></string-name>, <string-name><surname>Pamuk</surname> <given-names>Z</given-names></string-name>. <article-title>Automatic detection of coronavirus disease (COVID-19) using X-ray images and deep convolutional neural networks</article-title>. <source>Pattern Anal Appl</source>. <year>2021</year>;<volume>24</volume>(<issue>3</issue>):<fpage>1207</fpage>&#x2013;<lpage>20</lpage>.</mixed-citation></ref>
<ref id="ref69"><label>69</label><mixed-citation publication-type="journal"><string-name><surname>Brunese</surname> <given-names>L</given-names></string-name>, <string-name><surname>Mercaldo</surname> <given-names>F</given-names></string-name>, <string-name><surname>Reginelli</surname> <given-names>A</given-names></string-name>, <string-name><surname>Santone</surname> <given-names>A</given-names></string-name>. <article-title>Explainable deep learning for pulmonary disease and coronavirus COVID-19 detection from X-rays</article-title>. <source>Comput Methods Programs Biomed</source>. <year>2020</year>;<volume>196</volume>:<fpage>105608</fpage>.</mixed-citation></ref>
<ref id="ref70"><label>70</label><mixed-citation publication-type="journal"><string-name><surname>Ghoshal</surname> <given-names>B</given-names></string-name>, <string-name><surname>Tucker</surname> <given-names>A</given-names></string-name>. <article-title>Estimating uncertainty and interpretability in deep learning for coronavirus (COVID-19) detection</article-title>. <source>arXiv:2003.10769</source>. <year>2020</year>;<fpage>1</fpage>&#x2013;<lpage>14</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.48550/arXiv.2003.10769">https://doi.org/10.48550/arXiv.2003.10769</ext-link></mixed-citation></ref>
<ref id="ref71"><label>71</label><mixed-citation publication-type="journal"><string-name><surname>Apostolopoulos</surname> <given-names>ID</given-names></string-name>, <string-name><surname>Mpesiana</surname> <given-names>TA</given-names></string-name>. <article-title>Automatic detection from X-ray images utilizing transfer learning with convolutional neural networks</article-title>. <source>Phys Eng Sci Med</source>. <year>2020</year>;<volume>43</volume>(<issue>2</issue>):<fpage>635</fpage>&#x2013;<lpage>40</lpage>.</mixed-citation></ref>
<ref id="ref72"><label>72</label><mixed-citation publication-type="journal"><string-name><surname>Solayman</surname> <given-names>S</given-names></string-name>, <string-name><surname>Aumi</surname> <given-names>SA</given-names></string-name>, <string-name><surname>Mery</surname> <given-names>CS</given-names></string-name>, <string-name><surname>Mubassir</surname> <given-names>M</given-names></string-name>, <string-name><surname>Khan</surname> <given-names>R</given-names></string-name>. <article-title>Automatic COVID-19 prediction using explainable machine learning techniques</article-title>. <source>Int J Cogn Comput Eng</source>. <year>2023</year>;<volume>4</volume>:<fpage>36</fpage>&#x2013;<lpage>46</lpage>.</mixed-citation></ref>
<ref id="ref73"><label>73</label><mixed-citation publication-type="journal"><string-name><surname>Nanehkaran</surname> <given-names>YA</given-names></string-name>, <string-name><surname>Licai</surname> <given-names>Z</given-names></string-name>, <string-name><surname>Azarafza</surname> <given-names>M</given-names></string-name>, <string-name><surname>Talaei</surname> <given-names>S</given-names></string-name>, <string-name><surname>Jinxia</surname> <given-names>X</given-names></string-name>, <string-name><surname>Chen</surname> <given-names>J</given-names></string-name>, <etal>et al.</etal> <article-title>The predictive model for COVID-19 pandemic plastic pollution by using deep learning method</article-title>. <source>Sci Rep [Internet]</source>. <year>2023</year>;<volume>13</volume>(<issue>1</issue>):<fpage>1</fpage>&#x2013;<lpage>14</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1038/s41598-023-31416-y">https://doi.org/10.1038/s41598-023-31416-y</ext-link></mixed-citation></ref>
<ref id="ref74"><label>74</label><mixed-citation publication-type="journal"><string-name><surname>Song</surname> <given-names>Y</given-names></string-name>, <string-name><surname>Zheng</surname> <given-names>S</given-names></string-name>, <string-name><surname>Li</surname> <given-names>L</given-names></string-name>, <string-name><surname>Zhang</surname> <given-names>X</given-names></string-name>, <string-name><surname>Zhang</surname> <given-names>X</given-names></string-name>, <string-name><surname>Huang</surname> <given-names>Z</given-names></string-name>, <etal>et al.</etal> <article-title>Deep learning enables accurate diagnosis of novel coronavirus (COVID-19) with CT images</article-title>. <source>IEEE/ACM Trans Comput Biol Bioinforma</source>. <year>2021</year>;<volume>18</volume>(<issue>6</issue>):<fpage>2775</fpage>&#x2013;<lpage>80</lpage>.</mixed-citation></ref>
<ref id="ref75"><label>75</label><mixed-citation publication-type="journal"><string-name><surname>Jin</surname> <given-names>C</given-names></string-name>, <string-name><surname>Chen</surname> <given-names>W</given-names></string-name>, <string-name><surname>Cao</surname> <given-names>Y</given-names></string-name>, <string-name><surname>Xu</surname> <given-names>Z</given-names></string-name>, <string-name><surname>Tan</surname> <given-names>Z</given-names></string-name>, <string-name><surname>Zhang</surname> <given-names>X</given-names></string-name>, <etal>et al.</etal> <article-title>Development and evaluation of an artificial intelligence system for COVID-19 diagnosis</article-title>. <source>Nat Commun</source>. <year>2020</year>;<volume>11</volume>(<issue>1</issue>):<fpage>5088</fpage>.</mixed-citation></ref>
<ref id="ref76"><label>76</label><mixed-citation publication-type="journal"><string-name><surname>Ahsan</surname> <given-names>MM</given-names></string-name>, <string-name><surname>Alam</surname> <given-names>TE</given-names></string-name>, <string-name><surname>Trafalis</surname> <given-names>T</given-names></string-name>, <string-name><surname>Huebner</surname> <given-names>P</given-names></string-name>. <article-title>Deep MLP-CNN model using mixed-data to distinguish between COVID-19 and Non-COVID-19 patients</article-title>. <source>Symmetry (Basel)</source>. <year>2020</year>;<volume>12</volume>(<issue>9</issue>).</mixed-citation></ref>
<ref id="ref77"><label>77</label><mixed-citation publication-type="journal"><string-name><surname>Mao</surname> <given-names>Y</given-names></string-name>, <string-name><surname>He</surname> <given-names>Y</given-names></string-name>, <string-name><surname>Liu</surname> <given-names>L</given-names></string-name>, <string-name><surname>Chen</surname> <given-names>X</given-names></string-name>. <article-title>Disease classification based on eye movement features with decision tree and random forest</article-title>. <source>Front Neurosci</source>. <year>2020</year>;<volume>14</volume>:<fpage>1</fpage>&#x2013;<lpage>11</lpage>.</mixed-citation></ref>
<ref id="ref78"><label>78</label><mixed-citation publication-type="journal"><string-name><surname>Nosseir</surname> <given-names>A</given-names></string-name>, <string-name><surname>Shawky</surname> <given-names>MA</given-names></string-name>. <article-title>Automatic classifier for skin disease using k-NN and SVM</article-title>. <source>ICSIE-19: Proceedings of the 8th International Conference on Software and Information Engineering</source>. <year>2019</year>. p. <fpage>259</fpage>&#x2013;<lpage>62</lpage>.</mixed-citation></ref>
<ref id="ref79"><label>79</label><mixed-citation publication-type="journal"><string-name><surname>Khan</surname> <given-names>MA</given-names></string-name>, <string-name><surname>Ashraf</surname> <given-names>I</given-names></string-name>, <string-name><surname>Alhaisoni</surname> <given-names>M</given-names></string-name>, <string-name><surname>Damaševičius</surname> <given-names>R</given-names></string-name>, <string-name><surname>Scherer</surname> <given-names>R</given-names></string-name>, <string-name><surname>Rehman</surname> <given-names>A</given-names></string-name>, <etal>et al.</etal> <article-title>Multimodal brain tumor classification using deep learning and robust feature selection: A machine learning application for radiologists</article-title>. <source>Diagnostics</source>. <year>2020</year>;<volume>10</volume>(<issue>8</issue>):<fpage>1</fpage>&#x2013;<lpage>19</lpage>.</mixed-citation></ref>
<ref id="ref80"><label>80</label><mixed-citation publication-type="journal"><string-name><surname>Amin</surname> <given-names>J</given-names></string-name>, <string-name><surname>Sharif</surname> <given-names>M</given-names></string-name>, <string-name><surname>Raza</surname> <given-names>M</given-names></string-name>, <string-name><surname>Yasmin</surname> <given-names>M</given-names></string-name>. <article-title>Detection of brain tumor based on features fusion and machine learning</article-title>. <source>J Ambient Intell Humaniz Comput</source>. <year>2024</year>;<volume>15</volume>(<issue>1</issue>):<fpage>983</fpage>&#x2013;<lpage>99</lpage>.</mixed-citation></ref>
<ref id="ref81"><label>81</label><mixed-citation publication-type="journal"><string-name><surname>Dai</surname> <given-names>X</given-names></string-name>, <string-name><surname>Spasic</surname> <given-names>I</given-names></string-name>, <string-name><surname>Meyer</surname> <given-names>B</given-names></string-name>, <string-name><surname>Chapman</surname> <given-names>S</given-names></string-name>, <string-name><surname>Andres</surname> <given-names>F</given-names></string-name>. <article-title>Melanoma skin cancer detection using deep learning and classical machine learning techniques: A hybrid approach</article-title>. <source>2019 Fourth International Conference on Fog and Mobile Edge Computing (FMEC 2019)</source>. <year>2019</year>. p. <fpage>301</fpage>&#x2013;<lpage>5</lpage>.</mixed-citation></ref>
<ref id="ref82"><label>82</label><mixed-citation publication-type="journal"><string-name><surname>Dhaliwal</surname> <given-names>J</given-names></string-name>, <string-name><surname>Erdman</surname> <given-names>L</given-names></string-name>, <string-name><surname>Drysdale</surname> <given-names>E</given-names></string-name>, <string-name><surname>Rinawi</surname> <given-names>F</given-names></string-name>, <string-name><surname>Muir</surname> <given-names>J</given-names></string-name>, <string-name><surname>Walters</surname> <given-names>TD</given-names></string-name>, <etal>et al.</etal> <article-title>Accurate classification of pediatric colonic inflammatory bowel disease subtype using a random forest machine learning classifier</article-title>. <source>J Pediatr Gastroenterol Nutr</source>. <year>2021</year>;<volume>72</volume>(<issue>2</issue>):<fpage>262</fpage>&#x2013;<lpage>9</lpage>.</mixed-citation></ref>
<ref id="ref83"><label>83</label><mixed-citation publication-type="journal"><string-name><surname>Fathi</surname> <given-names>M</given-names></string-name>, <string-name><surname>Nemati</surname> <given-names>M</given-names></string-name>, <string-name><surname>Mohammadi</surname> <given-names>SM</given-names></string-name>, <string-name><surname>Abbasi-Kesbi</surname> <given-names>R</given-names></string-name>. <article-title>A machine learning approach based on SVM for classification of liver diseases</article-title>. <source>Biomed Eng - Appl Basis Commun</source>. <year>2020</year>;<volume>32</volume>(<issue>3</issue>):<fpage>1</fpage>&#x2013;<lpage>9</lpage>.</mixed-citation></ref>
<ref id="ref84"><label>84</label><mixed-citation publication-type="journal"><string-name><surname>Kalaiselvi</surname> <given-names>T</given-names></string-name>, <string-name><surname>Padmapriya</surname> <given-names>ST</given-names></string-name>, <string-name><surname>Sriramakrishnan</surname> <given-names>P</given-names></string-name>, <string-name><surname>Somasundaram</surname> <given-names>K</given-names></string-name>. <article-title>Deriving tumor detection models using convolutional neural networks from MRI of human brain scans</article-title>. <source>Int J Inf Technol</source>. <year>2020</year>;<volume>12</volume>(<issue>2</issue>):<fpage>403</fpage>&#x2013;<lpage>8</lpage>.</mixed-citation></ref>
<ref id="ref85"><label>85</label><mixed-citation publication-type="journal"><string-name><surname>Usman</surname> <given-names>K</given-names></string-name>, <string-name><surname>Rajpoot</surname> <given-names>K</given-names></string-name>. <article-title>Brain tumor classification from multi-modality MRI using wavelets and machine learning</article-title>. <source>Pattern Anal Appl</source>. <year>2017</year>;<volume>20</volume>(<issue>3</issue>):<fpage>871</fpage>&#x2013;<lpage>81</lpage>.</mixed-citation></ref>
<ref id="ref86"><label>86</label><mixed-citation publication-type="journal"><string-name><surname>Waheed</surname> <given-names>Z</given-names></string-name>, <string-name><surname>Waheed</surname> <given-names>A</given-names></string-name>, <string-name><surname>Zafar</surname> <given-names>M</given-names></string-name>, <string-name><surname>Riaz</surname> <given-names>F</given-names></string-name>. <article-title>An efficient machine learning approach for the detection of melanoma using dermoscopic images</article-title>. <source>2017 3rd IEEE International Conference on Computer and Communications (ICCC), Chengdu, China</source>. <year>2017</year>. pp. <fpage>316</fpage>&#x2013;<lpage>9</lpage>.</mixed-citation></ref>
<ref id="ref87"><label>87</label><mixed-citation publication-type="journal"><string-name><surname>Shalu</surname></string-name>, <string-name><surname>Kamboj</surname> <given-names>A</given-names></string-name>. <article-title>A color-based approach for melanoma skin cancer detection</article-title>. <source>2018 First International Conference on Secure Cyber Computing and Communication (ICSCCC), Jalandhar, India</source>. <year>2018</year>. pp. <fpage>508</fpage>&#x2013;<lpage>13</lpage>.</mixed-citation></ref>
<ref id="ref88"><label>88</label><mixed-citation publication-type="journal"><string-name><surname>Magalhaes</surname> <given-names>C</given-names></string-name>, <string-name><surname>Tavares</surname> <given-names>JMRS</given-names></string-name>, <string-name><surname>Mendes</surname> <given-names>J</given-names></string-name>, <string-name><surname>Vardasca</surname> <given-names>R</given-names></string-name>. <article-title>Comparison of machine learning strategies for infrared thermography of skin cancer</article-title>. <source>Biomed Signal Process Control</source>. <year>2021</year>;<volume>69</volume>:<fpage>102872</fpage>.</mixed-citation></ref>
<ref id="ref89"><label>89</label><mixed-citation publication-type="journal"><string-name><surname>Chen</surname> <given-names>M</given-names></string-name>, <string-name><surname>Zhang</surname> <given-names>B</given-names></string-name>, <string-name><surname>Topatana</surname> <given-names>W</given-names></string-name>, <string-name><surname>Cao</surname> <given-names>J</given-names></string-name>, <string-name><surname>Zhu</surname> <given-names>H</given-names></string-name>, <string-name><surname>Juengpanich</surname> <given-names>S</given-names></string-name>, <etal>et al.</etal> <article-title>Classification and mutation prediction based on histopathology H&amp;E images in liver cancer using deep learning</article-title>. <source>npj Precis Oncol</source>. <year>2020</year>;<volume>4</volume>(<issue>1</issue>):<fpage>1</fpage>&#x2013;<lpage>7</lpage>.</mixed-citation></ref>
<ref id="ref90"><label>90</label><mixed-citation publication-type="journal"><string-name><surname>Wang</surname> <given-names>Y</given-names></string-name>, <string-name><surname>Ji</surname> <given-names>C</given-names></string-name>, <string-name><surname>Wang</surname> <given-names>Y</given-names></string-name>, <string-name><surname>Ji</surname> <given-names>M</given-names></string-name>, <string-name><surname>Yang</surname> <given-names>JJ</given-names></string-name>, <string-name><surname>Zhou</surname> <given-names>CM</given-names></string-name>. <article-title>Predicting postoperative liver cancer death outcomes with machine learning</article-title>. <source>Curr Med Res Opin</source>. <year>2021</year>;<volume>37</volume>(<issue>4</issue>):<fpage>629</fpage>&#x2013;<lpage>34</lpage>.</mixed-citation></ref>
<ref id="ref91"><label>91</label><mixed-citation publication-type="journal"><string-name><surname>Taylor</surname> <given-names>RA</given-names></string-name>, <string-name><surname>Pare</surname> <given-names>JR</given-names></string-name>, <string-name><surname>Venkatesh</surname> <given-names>AK</given-names></string-name>, <string-name><surname>Mowafi</surname> <given-names>H</given-names></string-name>, <string-name><surname>Melnick</surname> <given-names>ER</given-names></string-name>, <string-name><surname>Fleischman</surname> <given-names>W</given-names></string-name>, <etal>et al.</etal> <article-title>Prediction of in-hospital mortality in emergency department patients with sepsis: a local big data-driven, machine learning approach</article-title>. <source>Acad Emerg Med</source>. <year>2016</year>;<volume>23</volume>:<fpage>269</fpage>&#x2013;<lpage>78</lpage>.</mixed-citation></ref>
<ref id="ref92"><label>92</label><mixed-citation publication-type="journal"><string-name><surname>Stanley</surname> <given-names>KO</given-names></string-name>, <string-name><surname>Clune</surname> <given-names>J</given-names></string-name>, <string-name><surname>Lehman</surname> <given-names>J</given-names></string-name>, <string-name><surname>Miikkulainen</surname> <given-names>R</given-names></string-name>. <article-title>Designing neural networks through neuroevolution</article-title>. <source>Nat Mach Intell</source>. <year>2019</year>;<volume>1</volume>(<issue>1</issue>):<fpage>24</fpage>&#x2013;<lpage>35</lpage>.</mixed-citation></ref>
<ref id="ref93"><label>93</label><mixed-citation publication-type="journal"><string-name><surname>Said</surname> <given-names>A</given-names></string-name>. <article-title>Bioinformatics and machine learning: analyzing genomic data for personalized medicine</article-title>. <source>Department of Computer Science, University of Cambridge</source>. <year>2023</year>:<fpage>1</fpage>&#x2013;<lpage>28</lpage>.</mixed-citation></ref>
<ref id="ref94"><label>94</label><mixed-citation publication-type="journal"><string-name><surname>Pawar</surname> <given-names>V</given-names></string-name>, <string-name><surname>Patil</surname> <given-names>A</given-names></string-name>, <string-name><surname>Tamboli</surname> <given-names>F</given-names></string-name>, <string-name><surname>Gaikwad</surname> <given-names>D</given-names></string-name>, <string-name><surname>Mali</surname> <given-names>D</given-names></string-name>, <string-name><surname>Shinde</surname> <given-names>A</given-names></string-name>. <article-title>Harnessing the power of AI in pharmacokinetics and pharmacodynamics: a comprehensive review</article-title>. <source>Int J Pharm Qual Assur</source>. <year>2023</year>;<volume>14</volume>(<issue>2</issue>):<fpage>426</fpage>&#x2013;<lpage>39</lpage>.</mixed-citation></ref>
<ref id="ref95"><label>95</label><mixed-citation publication-type="journal"><string-name><surname>Morota</surname> <given-names>G</given-names></string-name>, <string-name><surname>Ventura</surname> <given-names>RV</given-names></string-name>, <string-name><surname>Silva</surname> <given-names>FF</given-names></string-name>, <string-name><surname>Koyama</surname> <given-names>M</given-names></string-name>, <string-name><surname>Fernando</surname> <given-names>SC</given-names></string-name>. <article-title>Big data analytics and precision animal agriculture symposium: Machine learning and data mining advance predictive big data analysis in precision animal agriculture</article-title>. <source>J Anim Sci</source>. <year>2018</year>;<volume>96</volume>(<issue>4</issue>):<fpage>1540</fpage>&#x2013;<lpage>50</lpage>.</mixed-citation></ref>
<ref id="ref96"><label>96</label><mixed-citation publication-type="journal"><string-name><surname>Thirunavukarasu</surname> <given-names>AJ</given-names></string-name>, <string-name><surname>Ting</surname> <given-names>DSJ</given-names></string-name>, <string-name><surname>Elangovan</surname> <given-names>K</given-names></string-name>, <string-name><surname>Gutierrez</surname> <given-names>L</given-names></string-name>, <string-name><surname>Tan</surname> <given-names>TF</given-names></string-name>, <string-name><surname>Ting</surname> <given-names>DSW</given-names></string-name>. <article-title>Large language models in medicine</article-title>. <source>Nat Med</source>. <year>2023</year>;<volume>29</volume>(<issue>8</issue>):<fpage>1930</fpage>&#x2013;<lpage>40</lpage>.</mixed-citation></ref>
<ref id="ref97"><label>97</label><mixed-citation publication-type="journal"><string-name><surname>Rane</surname> <given-names>NL</given-names></string-name>, <string-name><surname>Tawde</surname> <given-names>A</given-names></string-name>, <string-name><surname>Choudhary</surname> <given-names>SP</given-names></string-name>, <string-name><surname>Rane</surname> <given-names>J</given-names></string-name>. <article-title>Contribution and performance of ChatGPT and other Large Language Models (LLM) for scientific and research advancements: a double-edged sword</article-title>. <source>Int Res J Mod Eng Technol Sci</source>. <year>2023</year>;<volume>5</volume>(<issue>10</issue>):<fpage>875</fpage>&#x2013;<lpage>99</lpage>.</mixed-citation></ref>
<ref id="ref98"><label>98</label><mixed-citation publication-type="journal"><string-name><surname>Nuthakki</surname> <given-names>S</given-names></string-name>. <article-title>Conversational AI and LLM&#x2019;s current and future impacts in improving and scaling health services</article-title>. <source>Int J Comput Eng Technol</source>. <year>2023</year>;<volume>14</volume>:<fpage>149</fpage>&#x2013;<lpage>55</lpage>.</mixed-citation></ref>
</ref-list>
</back>
</article>