<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "http://jats.nlm.nih.gov/publishing/1.3/JATS-journalpublishing1-3.dtd">
<article article-type="review-article" dtd-version="1.3" xml:lang="en" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="nlm-ta">PJAI</journal-id>
<journal-id journal-id-type="publisher-id">Premier Journal of Artificial Intelligence</journal-id>
<journal-id journal-id-type="pmc">PJAI</journal-id>
<journal-title-group>
<journal-title>PJ Artificial Intelligence</journal-title>
</journal-title-group>
<issn pub-type="epub">2977-5795</issn>
<publisher>
<publisher-name>Premier Science</publisher-name>
<publisher-loc>London, UK</publisher-loc>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.70389/PJAI.100018</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>REVIEW</subject>
</subj-group>
<subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Neuroscience</subject><subj-group><subject>Cognitive science</subject><subj-group><subject>Cognitive psychology</subject><subj-group><subject>Perception</subject><subj-group><subject>Sensory perception</subject><subj-group><subject>Hallucinations</subject></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Psychology</subject><subj-group><subject>Cognitive psychology</subject><subj-group><subject>Perception</subject><subj-group><subject>Sensory perception</subject><subj-group><subject>Hallucinations</subject></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Social sciences</subject><subj-group><subject>Psychology</subject><subj-group><subject>Cognitive psychology</subject><subj-group><subject>Perception</subject><subj-group><subject>Sensory perception</subject><subj-group><subject>Hallucinations</subject></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Neuroscience</subject><subj-group><subject>Sensory perception</subject><subj-group><subject>Hallucinations</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Social sciences</subject><subj-group><subject>Linguistics</subject><subj-group><subject>Grammar</subject><subj-group><subject>Phonology</subject><subj-group><subject>Syllables</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Engineering and technology</subject><subj-group><subject>Signal processing</subject><subj-group><subject>Speech signal processing</subject></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Neuroscience</subject><subj-group><subject>Cognitive science</subject><subj-group><subject>Cognitive psychology</subject><subj-group><subject>Perception</subject><subj-group><subject>Sensory perception</subject></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Psychology</subject><subj-group><subject>Cognitive psychology</subject><subj-group><subject>Perception</subject><subj-group><subject>Sensory perception</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Social sciences</subject><subj-group><subject>Psychology</subject><subj-group><subject>Cognitive psychology</subject><subj-group><subject>Perception</subject><subj-group><subject>Sensory perception</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Neuroscience</subject><subj-group><subject>Sensory perception</subject></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Medicine and health sciences</subject><subj-group><subject>Mental health and psychiatry</subject><subj-group><subject>Schizophrenia</subject></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Research and analysis methods</subject><subj-group><subject>Bioassays and physiological analysis</subject><subj-group><subject>Electrophysiological techniques</subject><subj-group><subject>Brain electrophysiology</subject><subj-group><subject>Electroencephalography</subject><subj-group><subject>Event-related potentials</subject></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Physiology</subject><subj-group><subject>Electrophysiology</subject><subj-group><subject>Neurophysiology</subject><subj-group><subject>Brain electrophysiology</subject><subj-group><subject>Electroencephalography</subject><subj-group><subject>Event-related potentials</subject></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Neuroscience</subject><subj-group><subject>Neurophysiology</subject><subj-group><subject>Brain electrophysiology</subject><subj-group><subject>Electroencephalography</subject><subj-group><subject>Event-related potentials</subject></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Neuroscience</subject><subj-group><subject>Brain mapping</subject><subj-group><subject>Electroencephalography</subject><subj-group><subject>Event-related potentials</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Medicine and health sciences</subject><subj-group><subject>Clinical medicine</subject><subj-group><subject>Clinical neurophysiology</subject><subj-group><subject>Electroencephalography</subject><subj-group><subject>Event-related potentials</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Research and analysis methods</subject><subj-group><subject>Imaging techniques</subject><subj-group><subject>Neuroimaging</subject><subj-group><subject>Electroencephalography</subject><subj-group><subject>Event-related potentials</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Neuroscience</subject><subj-group><subject>Neuroimaging</subject><subj-group><subject>Electroencephalography</subject><subj-group><subject>Event-related potentials</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Cell biology</subject><subj-group><subject>Cellular types</subject><subj-group><subject>Animal cells</subject><subj-group><subject>Neurons</subject><subj-group><subject>Interneurons</subject></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Neuroscience</subject><subj-group><subject>Cellular neuroscience</subject><subj-group><subject>Neurons</subject><subj-group><subject>Interneurons</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Research and analysis methods</subject><subj-group><subject>Bioassays and physiological analysis</subject><subj-group><subject>Electrophysiological techniques</subject><subj-group><subject>Brain electrophysiology</subject><subj-group><subject>Electroencephalography</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Physiology</subject><subj-group><subject>Electrophysiology</subject><subj-group><subject>Neurophysiology</subject><subj-group><subject>Brain electrophysiology</subject><subj-group><subject>Electroencephalography</subject></subj-group></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Neuroscience</subject><subj-group><subject>Neurophysiology</subject><subj-group><subject>Brain electrophysiology</subject><subj-group><subject>Electroencephalography</subject></subj-group></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Neuroscience</subject><subj-group><subject>Brain mapping</subject><subj-group><subject>Electroencephalography</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Medicine and health sciences</subject><subj-group><subject>Clinical medicine</subject><subj-group><subject>Clinical neurophysiology</subject><subj-group><subject>Electroencephalography</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Research and analysis methods</subject><subj-group><subject>Imaging techniques</subject><subj-group><subject>Neuroimaging</subject><subj-group><subject>Electroencephalography</subject></subj-group></subj-group></subj-group></subj-group><subj-group subj-group-type="Discipline-v3">
<subject>Biology and life sciences</subject><subj-group><subject>Neuroscience</subject><subj-group><subject>Neuroimaging</subject><subj-group><subject>Electroencephalography</subject></subj-group></subj-group></subj-group></subj-group>
</article-categories>
<title-group>
<article-title>Energy Load Forecasting with Machine Learning: Models, Metrics, and Future Directions</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Manzoor</surname>
<given-names>Muhammad Faraz</given-names>
</name>
<role content-type="http://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
<role content-type="http://credit.niso.org/contributor-roles/Writing-original-draft/">Writing &#x2013; original draft</role>
<role content-type="http://credit.niso.org/contributor-roles/review-editing/">Review and editing</role>
</contrib>
<aff id="aff1"><institution>Department of Artificial Intelligence, University of Management and Technology</institution>, <city>Lahore</city>, <country>Pakistan</country></aff>
</contrib-group>
<author-notes>
<corresp id="cor001"><bold>Correspondence to:</bold> Muhammad Faraz Manzoor, <email>Faraz.manzoor@umt.edu.pk</email></corresp>
</author-notes>
<pub-date pub-type="epub">
<day>05</day>
<month>08</month>
<year>2025</year>
</pub-date>
<pub-date pub-type="collection">
<month>08</month>
<year>2025</year>
</pub-date>
<volume>4</volume>
<issue>1</issue>
<elocation-id>100018</elocation-id>
<history>
<date date-type="received">
<day>15</day>
<month>06</month>
<year>2025</year>
</date>
<date date-type="rev-recd">
<day>05</day>
<month>07</month>
<year>2025</year>
</date>
<date date-type="accepted">
<day>19</day>
<month>07</month>
<year>2025</year>
</date>
</history>
<permissions>
<copyright-year>2025</copyright-year>
<copyright-holder>Muhammad Faraz Manzoor</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/" xlink:type="simple">
<license-p>This is an open access article distributed under the terms of the <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/licenses/by/4.0/" xlink:type="simple">Creative Commons Attribution License</ext-link>, which permits unrestricted use, distribution, and reproduction in any medium, provided the original author and source are credited.</license-p>
</license>
</permissions>
<self-uri content-type="pdf" xlink:href="info:doi/10.70389/PJAI.100018"/>
<abstract>
<p>Energy load forecasting plays a crucial role in the efficient management and operation of smart grids, enabling utilities to optimize energy distribution and improve grid reliability. Recent advancements in machine learning (ML) techniques have significantly enhanced the accuracy and adaptability of energy load prediction models. This review explores various ML models used for energy load forecasting, including traditional models, deep learning approaches such as long short-term memory (LSTM) networks and gated recurrent units (GRUs), and ensemble methods. The review discusses the strengths and limitations of each approach, highlighting its applicability to different forecasting timeframes and data characteristics. Additionally, it examines the performance evaluation metrics commonly used to assess model accuracy and reliability. Although multiple studies have examined forecasting techniques, there is a lack of comprehensive evaluation that connects model choice with practical deployment constraints such as data quality, real-time scalability, and interpretability. This review addresses this gap by systematically analyzing the challenges and emerging solutions in the context of smart grid applications. Despite the progress made, challenges related to data quality, computational complexity, and model interpretability remain significant barriers. The review concludes with an exploration of emerging trends and future directions in energy load forecasting, including hybrid models, federated learning, and reinforcement learning, which offer promising solutions to overcome existing limitations and improve forecasting performance in smart grid systems. Overall, the findings suggest that while no single model is universally optimal, integrating external factors, improving data quality, and adopting hybrid or explainable artificial intelligence (AI) approaches are critical for building more accurate, scalable, and interpretable forecasting systems.</p>
</abstract>
<kwd-group kwd-group-type="author">
<kwd>Energy load forecasting</kwd>
<kwd>Smart grids</kwd>
<kwd>Deep learning models</kwd>
<kwd>Ensemble methods</kwd>
<kwd>Predictive accuracy</kwd>
</kwd-group>
<counts>
<fig-count count="13"/>
<table-count count="11"/>
<equation-count count="10"/>
<page-count count="16"/>
</counts>
</article-meta>
</front>
<body>
<sec>
<title><ext-link ext-link-type="uri" xlink:href="https://premierscience.com/wp-content/uploads/2025/04/pjai-25-1017.pdf">Source-File: pjai-25-1017.pdf</ext-link></title>
</sec>
<sec id="sec001" sec-type="intro">
<title>Introduction</title>
<p>Energy load forecasting is important in smart grid management for the purpose of optimal demand side planning, resource and energy allocation, and cost optimization.<sup><xref ref-type="bibr" rid="ref1">1</xref></sup> The accuracy of prediction has been shown to be a necessity due to the growing integration of renewables and demand for more electricity. However, existing traditional forecasting methods, from statistical and econometric models, have limited success in generating such nonlinear and dynamic energy consumption patterns.<sup><xref ref-type="bibr" rid="ref2">2</xref></sup> In this context, machine learning (ML) is known as a game changer in the field, providing the ability to learn from historical consumption data and external factors to improve forecasting accuracy.</p>
<p>To better understand forecasting strategies, it is important to distinguish between types of energy load demands. Energy load forecasting can be further categorized based on specific end-use types such as cooling, heating, and general electricity demand, each having distinct characteristics and influencing factors. Cooling load forecasting is highly sensitive to outdoor air temperature and solar radiation, with significant variations during summer months and in commercial buildings. Heating load forecasting, on the other hand, is more influenced by low temperatures and seasonal shifts in winter, especially in residential zones. General electricity demand forecasting, while encompassing both heating and cooling needs, also includes lighting, appliances, and industrial usage patterns. These differences necessitate tailored forecasting models that account for the unique drivers and temporal patterns associated with each load type.</p>
<sec id="sec001-1">
<title>Importance of Energy Load Forecasting in Smart Grids</title>
<p>In order to balance supply and demand and to minimize operational costs and improve energy efficiency, smart grids are based on accurate energy load forecasting. This enables utility companies to generate power appropriately and not face energy crises or get dependent on backup power sources. Forecasting also provides for grid stability by knowing when peak demand will occur, and the supply is changed accordingly.<sup><xref ref-type="bibr" rid="ref3">3</xref></sup> As smart grids integrate more distributed energy resources, such as solar and wind power, forecasting becomes even more critical to manage intermittent generation and ensure grid reliability. If there is no right forecasting, energy providers might face supply versus transport mismatch, high operational cost, and poor energy distribution.<sup><xref ref-type="bibr" rid="ref4">4</xref></sup></p>
</sec>
<sec id="sec001-2">
<title>Role of ML in Improving Forecasting Accuracy</title>
<p>ML has revolutionized energy load forecasting by addressing the limitations of traditional methods,<sup><xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref></sup> Reinforcement Learning (RL) models are different from statistical models, which presume that data has a particular form to be modeled, but ML techniques can learn complicated patterns in data from history without preprogrammed declaration.<sup><xref ref-type="bibr" rid="ref7">7</xref></sup> Past consumption trends can be analyzed in a robust way that gives good predictions using supervised learning models like decision tree (DT) or random forest.<sup><xref ref-type="bibr" rid="ref8">8</xref></sup> Deep learning (DL) models, including the long short-term memory (LSTM) network and gated recurrent unit (GRU), excel in capturing long-term dependencies and seasonal variations. Moreover, hybrid models consisting of multiple ML techniques have demonstrated great potential in further increasing forecasting performance. By incorporating real-time data along with socioeconomic and weather-related factors, ML-based approaches offer a more responsive and precise method for forecasting energy load.<sup><xref ref-type="bibr" rid="ref9">9</xref></sup></p>
</sec>
<sec id="sec001-3">
<title>Scope and Objective of the Review</title>
<p>This review examines smart grid energy load forecasting using a succinct but comprehensive discussion of ML techniques to predict the energy load in this smart grid. This is to evaluate the effectiveness of different ML models and how well they can predict performance and its limitations. In this context, a summary of certain advantages of using ML in forecasting and some of the implementation challenges and possible future research directions is presented. This study synthesizes the recent advancements in the field and proposes insights into how ML can enable smart grids to operate with higher efficiency and reliability, thus helping to adopt more sustainable energy management practices.</p>
<p>To guide the reader, the structure of the review is as follows: Section Research Methodology outlines the methodology adopted for this study, including the systematic literature review (SLR) process, search strategy, selection criteria, and inclusion/exclusion parameters. Section ML Techniques for Energy Load Forecasting presents a detailed literature review of ML techniques applied to energy load forecasting. Section Comparison of Predictive Techniques and Common Evaluation Metrics provides a comparative analysis of various forecasting methods, including traditional models, DL architectures, and ensemble techniques, evaluating their performance across different forecasting scenarios. Section Challenges and Future Directions discusses the key challenges, such as data quality, computational demands, and interpretability, and outlines future directions, including hybrid approaches, federated learning, and RL. Finally, Section Conclusion concludes the review by summarizing the main findings and emphasizing the need for continued research to enhance the accuracy and robustness of energy load forecasting in smart grids.</p>
</sec>
</sec>
<sec id="sec002">
<title>Research Methodology</title>
<p>This study follows a SLR methodology to comprehensively analyze existing research on energy load forecasting techniques, as shown in <xref ref-type="fig" rid="F1">Figure 1</xref>. The methodology is structured to ensure transparency, reproducibility, and rigor in identifying, evaluating, and synthesizing relevant studies on ML models applied to energy load forecasting.<sup><xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref11">11</xref></sup></p>
<fig id="F1" position="float">
<object-id pub-id-type="doi">10.70389/journal.PJAI.100018.g001</object-id>
<label>Fig 1</label>
<caption><title>Systematic review process</title></caption>
<p><ext-link ext-link-type="uri" xlink:href="https://i0.wp.com/premierscience.com/wp-content/uploads/2025/04/pjai-25-1017-Figure-1.jpg?">Figure 1</ext-link></p>
</fig>
<sec id="sec002-1">
<title>Research Objective (RO) and Research Question (RQ) Formulation</title>
<p>This study uses a structured framework of ROs, RQs, and motivations to define the focus of the study in energy load forecasting, as shown in <xref ref-type="table" rid="T1">Table 1</xref>.</p>
<table-wrap id="T1">
<label>Table 1</label>
<caption><title>ROs and RQs mapping</title></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<th valign="top" align="left">SR#</th>
<th valign="top" align="left">RO</th>
<th valign="top" align="left">RQ</th>
<th valign="top" align="left">Motivation</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">1</td>
<td valign="top" align="left">Identify and analyze the most commonly used ML and DL techniques for energy load forecasting.</td>
<td valign="top" align="left">What are the most frequently applied ML and DL techniques for energy load forecasting?</td>
<td valign="top" align="left">Understanding the dominant models helps in recognizing methodological trends, strengths, and limitations, which can guide future research and practical deployment.</td>
</tr>
<tr>
<td valign="top" align="left">2</td>
<td valign="top" align="left">Examine the primary application areas, forecasting timeframes, and data types used in energy load prediction.</td>
<td valign="top" align="left">In what contexts, time horizons, and data environments is energy load forecasting commonly applied?</td>
<td valign="top" align="left">Analyzing use cases across different settings highlights domain-specific requirements, temporal challenges, and data dependency of forecasting models.</td>
</tr>
<tr>
<td valign="top" align="left">3</td>
<td valign="top" align="left">Investigate the key challenges in energy load forecasting and explore future directions to improve accuracy and scalability.</td>
<td valign="top" align="left">What are the major challenges in energy load forecasting, and what future directions can enhance model performance?</td>
<td valign="top" align="left">Identifying core challenges and emerging solutions can improve accuracy, real-time feasibility, and interpretability of forecasting systems in smart grids.</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="sec002-2">
<title>Literature Search Strategy</title>
<p>A search string was formulated to ensure that the search process captured only systematic and comprehensive studies relevant to energy load forecasting. The search string was designed to target literature focusing on the application of ML and DL techniques in forecasting energy consumption across various time horizons and contexts. The keywords and Boolean operators were defined as follows:</p>
<p><italic>(&#x201C;energy load forecasting&#x201D; OR &#x201C;electricity demand forecasting&#x201D; OR &#x201C;power load prediction&#x201D;) AND (&#x201C;machine learning&#x201D; OR &#x201C;deep learning&#x201D; OR &#x201C;time series prediction&#x201D;) AND (&#x201C;short-term&#x201D; OR &#x201C;long-term&#x201D; OR &#x201C;</italic><italic>real</italic><italic>-time&#x201D;) AND (&#x201C;smart grid&#x201D; OR &#x201C;energy systems&#x201D; OR &#x201C;utilities&#x201D;)</italic></p>
<p>This search string was applied across multiple academic databases, including IEEE Xplore, SpringerLink, ScienceDirect, and the Multidisciplinary Digital Publishing Institute (MDPI), to identify and collect relevant peer-reviewed articles.</p>
</sec>
<sec id="sec002-3">
<title>Study Selection Criteria</title>
<p>In order to limit the studies considered in this SLR to the most relevant and high-quality research, we applied a structured and multistage filtering process.<sup><xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref12">12</xref></sup> In this study, the selection was conducted in a sequential manner using rigorous screening at multiple levels, such as title-based screening, abstract-based filtering, and full-text review, as shown in <xref ref-type="fig" rid="F2">Figure 2</xref>. This process refined the selection to studies that contain direct contributions of data, models, or insights relevant to ML and DL techniques for energy load forecasting.<sup><xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref></sup></p>
<fig id="F2" position="float">
<object-id pub-id-type="doi">10.70389/journal.PJAI.100018.g002</object-id>
<label>Fig 2</label>
<caption><title>Study selection process</title></caption>
<p><ext-link ext-link-type="uri" xlink:href="https://i0.wp.com/premierscience.com/wp-content/uploads/2025/04/pjai-25-1017-Figure-2.jpg?">Figure 2</ext-link></p>
</fig>
<sec id="sec002-3-1">
<title>Title-Based Screening</title>
<p>In the first step of the selection process, a title-based screening was applied to the studies, where they were assessed based on their titles. Shortlisted research articles explicitly referred to techniques related to energy load forecasting, electricity demand prediction, time series modeling, ML, and DL. Also, studies with vague, overly general, or unrelated titles were immediately excluded to retain only relevant literature focused on forecasting within energy systems.</p>
</sec>
<sec id="sec002-3-2">
<title>Abstract-Based Screening</title>
<p>After the title screening, the abstracts of the shortlisted papers were carefully reviewed to determine their relevance. If the study focused on ML or DL techniques specifically applied to energy load forecasting, then the study was included. It also prioritized papers discussing applications in smart grids, utility demand prediction, renewable energy integration, and real-time load management. Suitable for further review were abstracts that provided technical insights into model architectures, datasets used, and performance evaluation metrics. At this phase, studies that lacked technical depth, focused on unrelated domains, or did not employ data-driven forecasting methods were excluded.</p>
</sec>
<sec id="sec002-3-3">
<title>Full-Text Review</title>
<p>Full-text review of the remaining studies completed the last stage of the selection process. This was an important step to ensure that the selected papers clearly described their methodology, experimental setup, and analytical results. Articles were included if they provided quantitative performance evaluation in the form of metrics such as root mean squared error (RMSE), mean absolute error (MAE), mean absolute percentage error (MAPE), R-squared (<italic>R</italic><sup><xref ref-type="bibr" rid="ref2">2</xref></sup>), or computational efficiency. Additionally, prioritized were studies that discussed challenges, limitations, and future research directions in the context of energy load forecasting. To improve the credibility and reliability of the reviewed literature, only articles published in high-impact journals or peer-reviewed conferences were considered. To ensure that only high-quality, methodologically sound, and impactful studies were included, papers with complete methodologies but lacking experimental validation, or those using outdated forecasting techniques, were excluded.</p>
</sec>
</sec>
<sec id="sec002-4">
<title>Inclusion and Exclusion Criteria</title>
<p>During the process of selecting high-quality and relevant studies, a set of predefined inclusion and exclusion criteria was applied to the study selection, as shown in <xref ref-type="table" rid="T2">Table 2</xref>. Refining the literature involved using these criteria to filter out studies that did not align with the ROs. In this SLR, the following specific inclusion and exclusion parameters were established, as detailed in the Table 2.</p>
<table-wrap id="T2">
<label>Table 2</label>
<caption><title>Inclusion exclusion criteria</title></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<th valign="top" align="left">Criteria</th>
<th valign="top" align="left">Inclusion</th>
<th valign="top" align="left">Exclusion</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Study type</td>
<td valign="top" align="left">Peer-reviewed journal articles, conference papers, and high-impact workshop papers</td>
<td valign="top" align="left">Non-peer-reviewed articles, book chapters, theses, white papers, or blogs</td>
</tr>
<tr>
<td valign="top" align="left">Research focus</td>
<td valign="top" align="left">Studies focusing on ML and DL techniques for energy load forecasting</td>
<td valign="top" align="left">Studies focusing on general data analytics or unrelated ML tasks</td>
</tr>
<tr>
<td valign="top" align="left">Dataset availability</td>
<td valign="top" align="left">Papers that use publicly available datasets or provide details of proprietary datasets used for model training and evaluation</td>
<td valign="top" align="left">Studies that do not specify datasets, making comparison and validation difficult</td>
</tr>
<tr>
<td valign="top" align="left">Technical depth</td>
<td valign="top" align="left">Papers providing detailed methodology, including model architectures, training procedures, and performance evaluation metrics</td>
<td valign="top" align="left">Studies lacking methodological clarity or experimental validation</td>
</tr>
<tr>
<td valign="top" align="left">Language</td>
<td valign="top" align="left">Papers published in English</td>
<td valign="top" align="left">Papers published in languages other than English</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="sec002-5">
<title>Study Selection Results</title>
<p>A total of 45 papers were selected and analyzed to address the RQs outlined above. <xref ref-type="table" rid="T2">Table 2</xref> presents the distribution of studies based on their sources, while <xref ref-type="table" rid="T3">Table 3</xref> provides a detailed list of the selected papers.</p>
<table-wrap id="T3">
<label>Table 3</label>
<caption><title>Study selection results</title></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<th valign="top" align="left">Phase</th>
<th valign="top" align="left">Process</th>
<th valign="top" align="left">Selection Stage</th>
<th valign="top" align="center">Elsevier</th>
<th valign="top" align="center">Springer</th>
<th valign="top" align="center">IEEE</th>
<th valign="top" align="center">MDPI</th>
<th valign="top" align="center">Others</th>
<th valign="top" align="center">Total</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">1</td>
<td valign="top" align="left">Search</td>
<td valign="top" align="left">Search string</td>
<td valign="top" align="center">319</td>
<td valign="top" align="center">1900</td>
<td valign="top" align="center">4719</td>
<td valign="top" align="center">2400</td>
<td valign="top" align="center">349</td>
<td valign="top" align="center">9687</td>
</tr>
<tr>
<td valign="top" align="left">2</td>
<td valign="top" align="left">Screening</td>
<td valign="top" align="left">Title</td>
<td valign="top" align="center">32</td>
<td valign="top" align="center">79</td>
<td valign="top" align="center">70</td>
<td valign="top" align="center">104</td>
<td valign="top" align="center">45</td>
<td valign="top" align="center">330</td>
</tr>
<tr>
<td valign="top" align="left">3</td>
<td valign="top" align="left">Screening</td>
<td valign="top" align="left">Abstract</td>
<td valign="top" align="center">21</td>
<td valign="top" align="center">29</td>
<td valign="top" align="center">18</td>
<td valign="top" align="center">30</td>
<td valign="top" align="center">8</td>
<td valign="top" align="center">106</td>
</tr>
<tr>
<td valign="top" align="left">4</td>
<td valign="top" align="left">Screening</td>
<td valign="top" align="left">Full text</td>
<td valign="top" align="center">11</td>
<td valign="top" align="center">10</td>
<td valign="top" align="center">16</td>
<td valign="top" align="center">5</td>
<td valign="top" align="center">3</td>
<td valign="top" align="center">45</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
</sec>
<sec id="sec003">
<title>ML Techniques for Energy Load Forecasting</title>
<p>ML techniques are used to model complex and nonlinear energy consumption patterns required by energy load forecasting. These techniques used historical data, real-time grid data, and external variables (weather, economic indicators) to leverage the prediction accuracy (<xref ref-type="fig" rid="F3">Figure 3</xref>). In general, these ML models are used: traditional ML models, DL models, and ensemble models. Each of these categories has advantages and challenges different enough to make it appropriate for a different forecasting scenario. Detailed discussion of these approaches is given in this section, including how they are applied, how effective they are, and how well they perform.</p>
<fig id="F3" position="float">
<object-id pub-id-type="doi">10.70389/journal.PJAI.100018.g003</object-id>
<label>Fig 3</label>
<caption><title>Taxonomy of techniques for energy load forecasting</title></caption>
<p><ext-link ext-link-type="uri" xlink:href="https://i0.wp.com/premierscience.com/wp-content/uploads/2025/04/pjai-25-1017-Figure-3.jpg?">Figure 3</ext-link></p>
</fig>
<sec id="sec003-1">
<title>Traditional ML Models</title>
<p>Energy load forecasting has traditionally relied on interpretable and computationally efficient ML models that perform well with structured data. Common examples of such models include the linear regression (LR), DT, support vector machine (SVM), and random forest (RF). These models are favored for their transparency and ease of implementation, particularly in short-term forecasting scenarios. For instance, S&#x00F6;derberg and Meurling<sup><xref ref-type="bibr" rid="ref15">15</xref></sup> conducted a comparative study on various ML models, including regression analysis and DTs, for predicting household energy consumption, highlighting their effectiveness in capturing consumption patterns. Similarly, Lahouar et al.<sup><xref ref-type="bibr" rid="ref16">16</xref></sup> developed a one-day-ahead load forecasting model using regression RF, demonstrating its accuracy and robustness in short-term load prediction. These studies underline the practical value of traditional ML approaches, particularly when interpretability and quick deployment are critical.</p>
<sec id="sec003-1-1">
<title>Linear Regression (LR)</title>
<p>One of the simplest models for energy load forecasting is linear regression with the assumption that a relationship with input variables (e.g., past energy consumption, temperature) and output variable (future energy demand) is linear (<xref ref-type="fig" rid="F4">Figure 4</xref>). For example, Sarker et al.<sup><xref ref-type="bibr" rid="ref17">17</xref></sup> utilized linear regression combined with inverse matrix analysis to forecast energy demand in remote areas of Bangladesh, demonstrating its efficacy in regions with limited data availability. On the other hand, Mahmud<sup><xref ref-type="bibr" rid="ref18">18</xref></sup> employed linear regression analysis to predict electricity loads in isolated areas lacking historical data, underscoring the model&#x2019;s practicality in diverse settings. The model is represented as:</p>
<fig id="F4" position="float">
<object-id pub-id-type="doi">10.70389/journal.PJAI.100018.g004</object-id>
<label>Fig 4</label>
<caption><title>General mechanism of linear regression</title></caption>
<p><ext-link ext-link-type="uri" xlink:href="https://i0.wp.com/premierscience.com/wp-content/uploads/2025/04/pjai-25-1017-Figure-4.jpg?">Figure 4</ext-link></p>
</fig>
<disp-formula id="M1"><label>(1)</label><mml:math id="DM1" display="block"><mml:mrow><mml:mi>Y</mml:mi><mml:mo>=</mml:mo><mml:msub><mml:mi>&#x03B2;</mml:mi><mml:mn>0</mml:mn></mml:msub><mml:mo>+</mml:mo><mml:mstyle displaystyle='true'><mml:munderover><mml:mo>&#x2211;</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover><mml:mrow><mml:msub><mml:mi>&#x03B2;</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:msub><mml:mi>X</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>+</mml:mo><mml:mi>&#x03B5;</mml:mi></mml:mrow></mml:mstyle></mml:mrow></mml:math></disp-formula>
<p>where <italic>Y</italic> is the predicted energy load, <italic>X</italic><italic>i</italic> are input features, <italic>&#x03B2;</italic><italic>i</italic> are coefficients, and &#x03B5; represents error terms. While LR is computationally efficient, its main limitation is its inability to model complex, nonlinear relationships in energy demand.</p>
</sec>
<sec id="sec003-1-2">
<title>Decision Tree (DT)</title>
<p>As DTs partition the dataset based on feature importances, DTs become suitable for capturing nonlinear dependencies in energy load data (<xref ref-type="fig" rid="F5">Figure 5</xref>). DTs are good with categorical as well as numeric features, but are prone to overfitting, more so for deep tree structure. Likewise, Hambali et al.<sup><xref ref-type="bibr" rid="ref19">19</xref></sup> evaluated various DT algorithms for electric power load forecasting and found that the REPTree technique outperformed others, highlighting its effectiveness in handling nonlinear relationships in load data. Likewise, Jahan et al.<sup><xref ref-type="bibr" rid="ref20">20</xref></sup> designed a DT model using weather and power load data as inputs for short-term demand forecasting, demonstrating the model&#x2019;s capability to capture complex dependencies in energy consumption patterns.</p>
<fig id="F5" position="float">
<object-id pub-id-type="doi">10.70389/journal.PJAI.100018.g005</object-id>
<label>Fig 5</label>
<caption><title>General mechanism of DT</title></caption>
<p><ext-link ext-link-type="uri" xlink:href="https://i0.wp.com/premierscience.com/wp-content/uploads/2025/04/pjai-25-1017-Figure-5.jpg?">Figure 5</ext-link></p>
</fig>
</sec>
<sec id="sec003-1-3">
<title>Support Vector Machine (SVM)</title>
<p>SVMs are effective for short-term load forecasting as they find an optimal hyperplane for classification or regression (<xref ref-type="fig" rid="F6">Figure 6</xref>). Furthermore, Tian and Noore<sup><xref ref-type="bibr" rid="ref21">21</xref></sup> proposed an SVM-based approach for short-term load forecasting, demonstrating improved generalization and lower prediction error compared to neural network methods. On the other side, Li and Fang<sup><xref ref-type="bibr" rid="ref22">22</xref></sup> applied SVMs to power system load forecasting, effectively enhancing forecasting accuracy. The model is based on:</p>
<fig id="F6" position="float">
<object-id pub-id-type="doi">10.70389/journal.PJAI.100018.g006</object-id>
<label>Fig 6</label>
<caption><title>General mechanism of SVM</title></caption>
<p><ext-link ext-link-type="uri" xlink:href="https://i0.wp.com/premierscience.com/wp-content/uploads/2025/04/pjai-25-1017-Figure-6.jpg?">Figure 6</ext-link></p>
</fig>
<disp-formula id="M2"><label>(2)</label><mml:math id="DM2" display="block"><mml:mrow><mml:munder><mml:mrow><mml:mi>min</mml:mi></mml:mrow><mml:mrow><mml:mi>w</mml:mi><mml:mo>,</mml:mo><mml:mi>b</mml:mi><mml:mo>,</mml:mo><mml:mi>&#x03BE;</mml:mi></mml:mrow></mml:munder><mml:mfrac><mml:mn>1</mml:mn><mml:mn>2</mml:mn></mml:mfrac><mml:mo>&#x007C;</mml:mo><mml:mrow><mml:mo>|</mml:mo> <mml:mi>w</mml:mi> <mml:mo>|</mml:mo></mml:mrow><mml:msup><mml:mo>&#x007C;</mml:mo><mml:mn>2</mml:mn></mml:msup><mml:mo>+</mml:mo><mml:mi>C</mml:mi><mml:munderover><mml:mstyle mathsize='140%' displaystyle='true'><mml:mo>&#x2211;</mml:mo></mml:mstyle><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover ><mml:msub><mml:mi>&#x03BE;</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:math></disp-formula>
<p>subject to constraints ensuring that predictions fall within an acceptable error margin. However, SVMs can be computationally expensive for large datasets.</p>
</sec>
<sec id="sec003-1-4">
<title>Random Forest (RF)</title>
<p>RF is an ensemble of DTs that serves the purposes of improving forecasting accuracy and reducing overfitting (<xref ref-type="fig" rid="F7">Figure 7</xref>). It merges the outputs from multiple trees, effectively improving robustness, and is a good candidate for energy load forecasting in dynamic ecosystems. Some researchers work on it like Dudek,<sup><xref ref-type="bibr" rid="ref23">23</xref></sup> who applied RF to short-term electricity load forecasting, demonstrating its ability to handle nonstationary and seasonal time series data effectively. Meanwhile, Gao et al.<sup><xref ref-type="bibr" rid="ref24">24</xref></sup> proposed an improved RF regression algorithm for ultra-short-term electricity load forecasting, achieving higher accuracy compared to traditional methods (<xref ref-type="table" rid="T4">Table 4</xref>).</p>
<fig id="F7" position="float">
<object-id pub-id-type="doi">10.70389/journal.PJAI.100018.g007</object-id>
<label>Fig 7</label>
<caption><title>General mechanism of RF</title></caption>
<p><ext-link ext-link-type="uri" xlink:href="https://i0.wp.com/premierscience.com/wp-content/uploads/2025/04/pjai-25-1017-Figure-7.jpg?">Figure 7</ext-link></p>
</fig>
<table-wrap id="T4">
<label>Table 4</label>
<caption><title>Comparison of traditional ML models for energy load forecasting</title></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<th valign="top" align="left">Model</th>
<th valign="top" align="left">Strengths</th>
<th valign="top" align="left">Weaknesses</th>
<th valign="top" align="left">Best For</th>
<th valign="top" align="left">Complexity</th>
<th valign="top" align="left">References</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Linear regression</td>
<td valign="top" align="left">Simple, interpretable</td>
<td valign="top" align="left">Cannot model nonlinear patterns</td>
<td valign="top" align="left">Baseline forecasting</td>
<td valign="top" align="left">Low</td>
<td valign="top" align="left">17,18</td>
</tr>
<tr>
<td valign="top" align="left">DTs</td>
<td valign="top" align="left">Handles categorical and numerical data well</td>
<td valign="top" align="left">Prone to overfitting</td>
<td valign="top" align="left">Medium-term forecasting</td>
<td valign="top" align="left">Medium</td>
<td valign="top" align="left">19,20</td>
</tr>
<tr>
<td valign="top" align="left">SVM</td>
<td valign="top" align="left">Robust to outliers</td>
<td valign="top" align="left">Computationally expensive</td>
<td valign="top" align="left">Short-term forecasting</td>
<td valign="top" align="left">High</td>
<td valign="top" align="left">21,22</td>
</tr>
<tr>
<td valign="top" align="left">RF</td>
<td valign="top" align="left">High accuracy, reduces overfitting</td>
<td valign="top" align="left">Less interpretable</td>
<td valign="top" align="left">Complex energy load patterns</td>
<td valign="top" align="left">Medium-High</td>
<td valign="top" align="left">23,24</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
</sec>
<sec id="sec003-2">
<title>DL Models</title>
<p>The growing popularity of DL models in energy load forecasting stems from their ability to capture long-term dependencies and model complex nonlinear relationships in energy consumption data. Notable models in this category include the artificial neural network (ANN), LSTM network, and GRU. Unlike traditional models, these architectures are capable of automatically extracting hierarchical features from raw time series data, making them particularly effective in scenarios with highly dynamic and temporally correlated consumption patterns.</p>
<sec id="sec003-2-1">
<title>Artificial Neural Networks (ANNs)</title>
<p>ANNs consist of multiple layers of neurons that learn energy consumption patterns from historical data (<xref ref-type="fig" rid="F8">Figure 8</xref>). Numerous researchers work on this model, including, Oreshkin et al.<sup><xref ref-type="bibr" rid="ref25">25</xref></sup> who introduced the N-BEATS neural network architecture, which demonstrated superior performance in mid-term electricity load forecasting across various European datasets. Similarly, Gao et al.<sup><xref ref-type="bibr" rid="ref26">26</xref></sup> proposed an ensemble deep random vector functional link (edRVFL) network, which achieved high accuracy in short-term load forecasting tasks by leveraging deep representation learning and ensemble strategies. The weight updates are as follows:</p>
<fig id="F8" position="float">
<object-id pub-id-type="doi">10.70389/journal.PJAI.100018.g008</object-id>
<label>Fig 8</label>
<caption><title>General mechanism of ANN</title></caption>
<p><ext-link ext-link-type="uri" xlink:href="https://i0.wp.com/premierscience.com/wp-content/uploads/2025/04/pjai-25-1017-Figure-8.jpg?">Figure 8</ext-link></p>
</fig>
<disp-formula id="M3"><label>(3)</label><mml:math id="DM3" display="block"><mml:mrow><mml:msub><mml:mi>w</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:msub><mml:mi>w</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:mi>&#x03B7;</mml:mi><mml:mfrac><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:mi>E</mml:mi></mml:mrow><mml:mrow><mml:mo>&#x2202;</mml:mo><mml:msub><mml:mi>w</mml:mi><mml:mrow><mml:mi>i</mml:mi><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mfrac></mml:mrow></mml:math></disp-formula>
<p>where <italic>w</italic><sub><italic>ij</italic></sub> are weights, <italic>&#x3b7;</italic> is the learning rate, and E is the error function. ANNs perform well for medium- to long-term load forecasting but require large datasets and high computational power.</p>
</sec>
<sec id="sec003-2-2">
<title>LSTM Networks</title>
<p>Energy load data are captured with temporal dependencies by LSTM networks, a type of recurrent neural network (RNN). However, due to vanishing gradients in traditional RNNs, they overcome vanishing gradients through memory cells that store information for long periods (<xref ref-type="fig" rid="F9">Figure 9</xref>). However, the DA-LSTM framework introduced by Bayram et al.<sup><xref ref-type="bibr" rid="ref27">27</xref></sup> is a dynamic drift-adaptive learning model designed for interval load forecasting. This approach enhances forecasting accuracy by adapting to changes in consumption patterns without requiring predefined drift thresholds. Meanwhile, a hybrid LSTM model was developed by Lu et al.<sup><xref ref-type="bibr" rid="ref28">28</xref></sup> incorporating online correction mechanisms. Their model integrates temporal and nontemporal features and employs an online correction strategy to adjust to real-time data distribution shifts, thereby improving day-ahead load forecasting accuracy. The cell state update is given by:</p>
<fig id="F9" position="float">
<object-id pub-id-type="doi">10.70389/journal.PJAI.100018.g009</object-id>
<label>Fig 9</label>
<caption><title>General mechanism of LSTM</title></caption>
<p><ext-link ext-link-type="uri" xlink:href="https://i0.wp.com/premierscience.com/wp-content/uploads/2025/04/pjai-25-1017-Figure-9.jpg?">Figure 9</ext-link></p>
</fig>
<disp-formula id="M4"><label>(4)</label><mml:math id="DM4" display="block"><mml:mrow><mml:msub><mml:mi>C</mml:mi><mml:mi>t</mml:mi></mml:msub><mml:mo>=</mml:mo><mml:msub><mml:mi>f</mml:mi><mml:mi>t</mml:mi></mml:msub><mml:mo>.</mml:mo><mml:msub><mml:mi>C</mml:mi><mml:mrow><mml:mi>t</mml:mi><mml:mo>&#x2212;</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mi>i</mml:mi><mml:mi>t</mml:mi></mml:msub><mml:mo>.</mml:mo><mml:msub><mml:mover accent='true'><mml:mi>C</mml:mi><mml:mo>&#x02DC;</mml:mo></mml:mover><mml:mi>t</mml:mi></mml:msub></mml:mrow></mml:math></disp-formula>
<p>where <italic>C</italic><sub><italic>t</italic></sub> is the cell state, <italic>C</italic><sub><italic>t</italic></sub> is the forget gate, and <italic>i</italic><sub><italic>t</italic></sub> is the input gate. LSTMs are highly effective for energy load forecasting due to their ability to recognize seasonality and trends.</p>
</sec>
<sec id="sec003-2-3">
<title>Gated Recurrent Units (GRUs)</title>
<p>The main difference between GRUs and LSTMs is that the former has a simpler architecture and therefore computational complexity (<xref ref-type="fig" rid="F10">Figure 10</xref>). The short-term dependency between the periods is balanced with the long-term dependency and therefore, it is a decent indication for real-time energy load forecasting. For example, Emshagin et al.<sup><xref ref-type="bibr" rid="ref29">29</xref></sup> developed customized LSTM and GRU models for short-term household electricity consumption prediction. Their study found that while both models effectively captured consumption patterns, LSTM slightly outperformed GRU in forecasting accuracy. Likewise, Dong and Grumbach<sup><xref ref-type="bibr" rid="ref30">30</xref></sup> introduced a hybrid long-term load forecasting method utilizing both LSTM and GRU networks. Their approach successfully integrated top-down, bottom-up, and sequential information, demonstrating the practicality of GRUs in capturing temporal dependencies in energy consumption data (<xref ref-type="table" rid="T5">Table 5</xref>).</p>
<fig id="F10" position="float">
<object-id pub-id-type="doi">10.70389/journal.PJAI.100018.g010</object-id>
<label>Fig 10</label>
<caption><title>General mechanism of GRU</title></caption>
<p><ext-link ext-link-type="uri" xlink:href="https://i0.wp.com/premierscience.com/wp-content/uploads/2025/04/pjai-25-1017-Figure-10.jpg?">Figure 10</ext-link></p>
</fig>
<table-wrap id="T5">
<label>Table 5</label>
<caption><title>Comparison of DL models for energy load forecasting</title></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<th valign="top" align="left">Model</th>
<th valign="top" align="left">Strengths</th>
<th valign="top" align="left">Weaknesses</th>
<th valign="top" align="left">Best For</th>
<th valign="top" align="left">Complexity</th>
<th valign="top" align="left">References</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">ANN</td>
<td valign="top" align="left">Captures nonlinear relationships</td>
<td valign="top" align="left">Requires large datasets</td>
<td valign="top" align="left">Medium-term forecasting</td>
<td valign="top" align="left">High</td>
<td valign="top" align="left">25,26</td>
</tr>
<tr>
<td valign="top" align="left">LSTM</td>
<td valign="top" align="left">Models long-term dependencies</td>
<td valign="top" align="left">Computationally expensive</td>
<td valign="top" align="left">Long-term forecasting</td>
<td valign="top" align="left">Very High</td>
<td valign="top" align="left">27,28</td>
</tr>
<tr>
<td valign="top" align="left">GRU</td>
<td valign="top" align="left">Simplifies LSTM with similar accuracy</td>
<td valign="top" align="left">May not capture complex dependencies</td>
<td valign="top" align="left">Real-time forecasting</td>
<td valign="top" align="left">High</td>
<td valign="top" align="left">29,30</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
</sec>
<sec id="sec003-3">
<title>Ensemble Approaches</title>
<p>Ensemble learning combines the predictive strengths of multiple models to improve forecasting accuracy and reduce variance in predictions. This approach is particularly effective in addressing the limitations of individual models by aggregating their outputs. The common ensemble methods used for energy load forecasting include boosting, bagging, and hybrid models. Boosting techniques sequentially train models to correct errors of previous ones, while bagging methods reduce variance by averaging predictions across independently trained models. Hybrid models, on the other hand, integrate different algorithmic paradigms&#x2014;such as combining traditional and DL models&#x2014;to leverage the advantages of both.</p>
<sec id="sec003-3-1">
<title>Boosting Methods</title>
<p>Boosting methods, such as gradient boosting machines (GBMs), XGBoost, and AdaBoost, iteratively improve weak learners by focusing on difficult-to-predict instances (<xref ref-type="fig" rid="F11">Figure 11</xref>). A bagging model named XASXG proposed by, Ding et al.<sup><xref ref-type="bibr" rid="ref31">31</xref></sup> which integrates autoregressive integrated moving average (ARIMA), support vector regression (SVR), and XGBoost. This model effectively captures the nonstationary and nonlinear characteristics of electricity load time series, resulting in superior forecasting accuracy across various Chinese cities. Similarly, Rubattu et al.<sup><xref ref-type="bibr" rid="ref32">32</xref></sup> developed a predictive model utilizing probabilistic LightGBM combined with temporal hierarchies and advanced feature engineering. Their approach achieved high accuracy in the BigDeal Challenge 2022, demonstrating the efficacy of boosting methods in load and peak forecasting tasks. The loss function for boosting is:</p>
<fig id="F11" position="float">
<object-id pub-id-type="doi">10.70389/journal.PJAI.100018.g011</object-id>
<label>Fig 11</label>
<caption><title>General mechanism of boosting method</title></caption>
<p><ext-link ext-link-type="uri" xlink:href="https://i0.wp.com/premierscience.com/wp-content/uploads/2025/04/pjai-25-1017-Figure-11.jpg?">Figure 11</ext-link></p>
</fig>
<disp-formula id="M5"><label>(5)</label><mml:math id="DM5" display="block"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mi>m</mml:mi></mml:msub><mml:mrow><mml:mo>(</mml:mo><mml:mi>x</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:msub><mml:mi>F</mml:mi><mml:mrow><mml:mi>m</mml:mi><mml:mo>&#x2212;</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mrow><mml:mo>(</mml:mo><mml:mi>x</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mo>+</mml:mo><mml:mi>&#x03B3;</mml:mi><mml:msub><mml:mi>h</mml:mi><mml:mi>m</mml:mi></mml:msub><mml:mrow><mml:mo>(</mml:mo><mml:mi>x</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:mrow></mml:math></disp-formula>
<p>where <italic>F</italic><italic>m</italic> (<italic>x</italic>) is the current model, <italic>h</italic><italic>m</italic> (<italic>x</italic>) is the new weak learner, and <italic>&#x03B3;</italic> is a learning rate. These methods enhance accuracy but may suffer from overfitting if not carefully tuned.</p>
</sec>
<sec id="sec003-3-2">
<title>Bagging Methods</title>
<p>To reduce variance and improve stability, bagging techniques such as RF and bootstrap aggregation perform a number of versions of the training dataset (<xref ref-type="fig" rid="F12">Figure 12</xref>). Thus, these models are good at handling fluctuating energy demand patterns. A cluster-based bootstrapping method was introduced by Dube et al.<sup><xref ref-type="bibr" rid="ref33">33</xref></sup> for interval prediction of electricity demand. Their approach utilizes residual bootstrapping combined with unsupervised clustering to generate accurate interval forecasts, particularly beneficial in microgrid settings with high demand variability. Additionally, the BaggingSHAP model, which was proposed by Olumba et al.,<sup><xref ref-type="bibr" rid="ref34">34</xref></sup> combines bagging combines bagging with SHapley Additive exPlanations (SHAP) for enhanced interpretability in energy demand forecasting. The model achieved an <italic>R</italic><sup><xref ref-type="bibr" rid="ref2">2</xref></sup> score of 0.9947, indicating superior predictive performance.</p>
<fig id="F12" position="float">
<object-id pub-id-type="doi">10.70389/journal.PJAI.100018.g012</object-id>
<label>Fig 12</label>
<caption><title>General mechanism of bagging method</title></caption>
<p><ext-link ext-link-type="uri" xlink:href="https://i0.wp.com/premierscience.com/wp-content/uploads/2025/04/pjai-25-1017-Figure-12.jpg?">Figure 12</ext-link></p>
</fig>
</sec>
<sec id="sec003-3-3">
<title>Hybrid Models</title>
<p>Traditional forecasting techniques are combined with the DL approaches using hybrid models to optimize the forecasting performance (<xref ref-type="fig" rid="F13">Figure 13</xref>). As an example, RF and LSTM can be used together by an RF-LSTM model to select features with RF, apply LSTM to temporal pattern recognition while remaining both interpretable and accurate. Meanwhile, Zhang et al.<sup><xref ref-type="bibr" rid="ref35">35</xref></sup> proposed a hybrid model combining RF and LSTM to improve short-term electricity load forecasting, demonstrating reduced prediction errors compared to standalone models. Similarly, Ma et al.<sup><xref ref-type="bibr" rid="ref36">36</xref></sup> developed a hybrid RF-LSTM approach that leveraged RF for selecting the most relevant input features and LSTM for modeling sequential dependencies, achieving superior results in multistep energy load forecasting tasks (<xref ref-type="table" rid="T6">Table 6</xref>).</p>
<fig id="F13" position="float">
<object-id pub-id-type="doi">10.70389/journal.PJAI.100018.g013</object-id>
<label>Fig 13</label>
<caption><title>General mechanism of hybrid models</title></caption>
<p><ext-link ext-link-type="uri" xlink:href="https://i0.wp.com/premierscience.com/wp-content/uploads/2025/04/pjai-25-1017-Figure-13.jpg?">Figure 13</ext-link></p>
</fig>
<table-wrap id="T6">
<label>Table 6</label>
<caption><title>Comparison of ensemble approaches for energy load forecasting</title></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<th valign="top" align="left">Model</th>
<th valign="top" align="left">Strengths</th>
<th valign="top" align="left">Weaknesses</th>
<th valign="top" align="left">Best For</th>
<th valign="top" align="left">Complexity</th>
<th valign="top" align="left">References</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Boosting (XGBoost, AdaBoost)</td>
<td valign="top" align="left">Improves weak learners iteratively</td>
<td valign="top" align="left">May overfit</td>
<td valign="top" align="left">High-variance energy patterns</td>
<td valign="top" align="left">High</td>
<td valign="top" align="left">31,32</td>
</tr>
<tr>
<td valign="top" align="left">Bagging (RF)</td>
<td valign="top" align="left">Reduces variance, robust</td>
<td valign="top" align="left">Less interpretable</td>
<td valign="top" align="left">Medium-term forecasting</td>
<td valign="top" align="left">Medium</td>
<td valign="top" align="left">33,34</td>
</tr>
<tr>
<td valign="top" align="left">Hybrid (RF-LSTM)</td>
<td valign="top" align="left">Leverages best of both models</td>
<td valign="top" align="left">High computational cost</td>
<td valign="top" align="left">Long-term forecasting</td>
<td valign="top" align="left">Very High</td>
<td valign="top" align="left">35,36</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Ensemble methods provide a robust solution for energy load forecasting, particularly when dealing with fluctuating consumption patterns and large-scale smart grid data. They enhance forecasting accuracy by reducing bias and variance while leveraging the strengths of multiple models.</p>
</sec>
</sec>
</sec>
<sec id="sec004">
<title>Comparison of Predictive Techniques and Common Evaluation Metrics</title>
<p>The effectiveness of predictive techniques in energy load forecasting largely depends on the accuracy, reliability, and efficiency of the ML models employed. Selecting the appropriate technique requires evaluating which model performs best based on specific performance metrics, while also considering the trade-offs associated with each approach. This section reviews commonly used ML models for energy load forecasting and provides a comparative analysis of their strengths and limitations with respect to various evaluation metrics.</p>
<sec id="sec004-1">
<title>Performance Metrics Used for Evaluation</title>
<p>There have been diverse performance metrics used to assess the predictive accuracy and reliability of the ML models used in energy load forecasting. This is useful in determining how well the model will minimize errors, and if it can be applied to average real-world problems. Mean squared error (MSE), RMSE, MAE, MAPE, and <italic>R</italic><sup><xref ref-type="bibr" rid="ref2">2</xref></sup> are the most common performance metrics.</p>
<sec id="sec004-1-1">
<title>Mean Squared Error (MSE)</title>
<p>MSE measures the average squared difference between predicted and actual values, with a focus on penalizing larger errors more than smaller ones. According to, Chai and Draxler<sup><xref ref-type="bibr" rid="ref37">37</xref></sup> MSE is a commonly preferred metric in regression tasks due to its mathematical simplicity and sensitivity to large deviations. Likewise, Willmott and Matsuura<sup><xref ref-type="bibr" rid="ref38">38</xref></sup> compared MSE with MAE, emphasizing MSE&#x2019;s utility when highlighting significant prediction errors is crucial in model evaluation. It is calculated as:</p>
<disp-formula id="M6"><label>(6)</label><mml:math id="DM6" display="block"><mml:mrow><mml:mi>M</mml:mi><mml:mi>S</mml:mi><mml:mi>E</mml:mi><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:munderover><mml:mstyle mathsize='140%' displaystyle='true'><mml:mo>&#x2211;</mml:mo></mml:mstyle><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover ><mml:msup><mml:mrow><mml:mo stretchy='false'>(</mml:mo><mml:msub><mml:mi>y</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>&#x2212;</mml:mo><mml:msub><mml:mover accent='true'><mml:mi>y</mml:mi><mml:mo>&#x005E;</mml:mo></mml:mover><mml:mi>i</mml:mi></mml:msub><mml:mo stretchy='false'>)</mml:mo></mml:mrow><mml:mn>2</mml:mn></mml:msup></mml:mrow></mml:math></disp-formula>
<p><italic>&#x302;</italic></p>
<p>where <italic>y</italic><italic>i</italic> is the actual value, <italic>&#x177;</italic><italic>i</italic> is the predicted value, and <italic>n</italic> is the total number of data points. MSE is sensitive to outliers, as it squares the error terms, which can lead to a disproportionate influence of large errors.</p>
</sec>
<sec id="sec004-1-2">
<title>Root Mean Squared Error (RMSE)</title>
<p>RMSE is the square root of the MSE and provides a more interpretable error metric in the original units of the data. As highlighted by, Hyndman and Koehler<sup><xref ref-type="bibr" rid="ref39">39</xref></sup> RMSE is particularly useful when large prediction errors are undesirable, offering a balance between interpretability and sensitivity. Meanwhile, Hong et al.<sup><xref ref-type="bibr" rid="ref40">40</xref></sup> emphasized the importance of RMSE in energy forecasting competitions due to its ability to reflect forecasting accuracy effectively across different models and datasets. It is calculated as:</p>
<disp-formula id="M7"><label>(7)</label><mml:math id="DM7" display="block"><mml:mrow><mml:mtext>RMSE</mml:mtext><mml:mo>=</mml:mo><mml:msqrt><mml:mrow><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:munderover><mml:mstyle mathsize='140%' displaystyle='true'><mml:mo>&#x2211;</mml:mo></mml:mstyle><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover ><mml:msup><mml:mrow><mml:mo stretchy='false'>(</mml:mo><mml:msub><mml:mi>y</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>&#x2212;</mml:mo><mml:msub><mml:mover accent='true'><mml:mi>y</mml:mi><mml:mo>&#x005E;</mml:mo></mml:mover><mml:mi>i</mml:mi></mml:msub><mml:mo stretchy='false'>)</mml:mo></mml:mrow><mml:mn>2</mml:mn></mml:msup></mml:mrow></mml:msqrt></mml:mrow></mml:math></disp-formula>
<p><italic>&#x302;</italic></p>
<p>RMSE is widely used in energy load forecasting because it reflects the magnitude of the error in a way that is more understandable to practitioners. However, like MSE, it is also sensitive to large errors.</p>
</sec>
<sec id="sec004-1-3">
<title>Mean Absolute Error (MAE)</title>
<p>MAE measures the average magnitude of errors in a set of predictions, without considering their direction. However, Willmott et al.<sup><xref ref-type="bibr" rid="ref38">38</xref></sup> emphasized the interpretability and robustness of MAE in environmental and climate modeling contexts, showing its reliability across diverse datasets. However, Hyndman and Koehler<sup><xref ref-type="bibr" rid="ref39">39</xref></sup> discussed MAE as a reliable baseline metric in forecast accuracy comparisons, particularly useful when comparing models across datasets with different scales. It is given by:</p>
<disp-formula id="M8"><label>(8)</label><mml:math id="DM8" display="block"><mml:mrow><mml:mtext>MAE</mml:mtext><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:munderover><mml:mstyle mathsize='140%' displaystyle='true'><mml:mo>&#x2211;</mml:mo></mml:mstyle><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover ><mml:mo>&#x007C;</mml:mo><mml:msub><mml:mi>y</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>&#x2212;</mml:mo><mml:msub><mml:mover accent='true'><mml:mi>y</mml:mi><mml:mo>&#x005E;</mml:mo></mml:mover><mml:mi>i</mml:mi></mml:msub><mml:msup><mml:mo>&#x007C;</mml:mo><mml:mn>2</mml:mn></mml:msup></mml:mrow></mml:math></disp-formula>
<p><italic>&#x302;</italic></p>
<p>MAE is less sensitive to outliers compared to MSE and RMSE, making it suitable for applications where large deviations are less critical. It provides a straightforward measure of how far the predictions are from the actual values on average.</p>
</sec>
<sec id="sec004-1-4">
<title>Mean Absolute Percentage Error (MAPE)</title>
<p>MAPE calculates the error as a percentage of the actual value, making it easier to interpret and compare across different datasets. As noted by Makridakis,<sup><xref ref-type="bibr" rid="ref41">41</xref></sup> MAPE remains one of the most commonly used metrics in forecasting competitions due to its intuitive nature and interpretability. However Evans,<sup><xref ref-type="bibr" rid="ref42">42</xref></sup> also pointed out that MAPE&#x2019;s sensitivity to low actual values may distort its usefulness, especially in datasets with high variability or occasional zero values. It is calculated as:</p>
<disp-formula id="M9"><label>(9)</label><mml:math id="DM9" display="block"><mml:mrow><mml:mtext>MAPE</mml:mtext><mml:mo>=</mml:mo><mml:mfrac><mml:mn>1</mml:mn><mml:mi>n</mml:mi></mml:mfrac><mml:munderover><mml:mstyle mathsize='140%' displaystyle='true'><mml:mo>&#x2211;</mml:mo></mml:mstyle><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:munderover ><mml:mo>&#x007C;</mml:mo><mml:mfrac><mml:mrow><mml:msub><mml:mi>y</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>&#x2212;</mml:mo><mml:msub><mml:mover accent='true'><mml:mi>y</mml:mi><mml:mo>&#x005E;</mml:mo></mml:mover><mml:mi>i</mml:mi></mml:msub></mml:mrow><mml:mrow><mml:msub><mml:mi>y</mml:mi><mml:mi>i</mml:mi></mml:msub></mml:mrow></mml:mfrac><mml:mo>&#x007C;</mml:mo><mml:mo>&#x00D7;</mml:mo><mml:mn>100</mml:mn></mml:mrow></mml:math></disp-formula>
<p><italic>&#x302;</italic></p>
<p>MAPE is useful when comparing forecast accuracy across different models and datasets, but it can be problematic when actual values are close to zero, leading to inflated error percentages.</p>
</sec>
<sec id="sec004-1-5">
<title>R-Squared (R<sup><xref ref-type="bibr" rid="ref2">2</xref></sup>)</title>
<p><italic>R</italic><sup><xref ref-type="bibr" rid="ref2">2</xref></sup> measures the proportion of the variance in the dependent variable that is predictable from the independent variables. According to Draper and Smith,<sup><xref ref-type="bibr" rid="ref43">43</xref></sup> <italic>R</italic><sup><xref ref-type="bibr" rid="ref2">2</xref></sup> is widely used in regression analysis as it succinctly summarizes the explanatory power of a model. However, as noted by Alexander,<sup><xref ref-type="bibr" rid="ref44">44</xref></sup> <italic>R</italic><sup><xref ref-type="bibr" rid="ref2">2</xref></sup> alone can be misleading in evaluating model performance, especially in cases of overfitting or when used with nonlinear models, thus warranting the use of adjusted <italic>R</italic><sup><xref ref-type="bibr" rid="ref2">2</xref></sup> or complementary metrics. It is calculated as:</p>
<disp-formula id="M10"><label>(10)</label><mml:math id="DM10" display="block"><mml:mrow><mml:msup><mml:mi>R</mml:mi><mml:mn>2</mml:mn></mml:msup><mml:mo>=</mml:mo><mml:mn>1</mml:mn><mml:mo>&#x2212;</mml:mo><mml:mfrac><mml:mrow><mml:msubsup><mml:mstyle mathsize='140%' displaystyle='true'><mml:mo>&#x2211;</mml:mo></mml:mstyle><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:msubsup><mml:msup><mml:mrow><mml:mo stretchy='false'>(</mml:mo><mml:msub><mml:mi>y</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>&#x2212;</mml:mo><mml:msub><mml:mover accent='true'><mml:mi>y</mml:mi><mml:mo>&#x005E;</mml:mo></mml:mover><mml:mi>i</mml:mi></mml:msub><mml:mo stretchy='false'>)</mml:mo></mml:mrow><mml:mn>2</mml:mn></mml:msup></mml:mrow><mml:mrow><mml:msubsup><mml:mstyle mathsize='140%' displaystyle='true'><mml:mo>&#x2211;</mml:mo></mml:mstyle><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>n</mml:mi></mml:msubsup><mml:msup><mml:mrow><mml:mo stretchy='false'>(</mml:mo><mml:msub><mml:mi>y</mml:mi><mml:mi>i</mml:mi></mml:msub><mml:mo>&#x2212;</mml:mo><mml:msub><mml:mover accent='true'><mml:mi>y</mml:mi><mml:mo>&#x00AF;</mml:mo></mml:mover><mml:mi>i</mml:mi></mml:msub><mml:mo stretchy='false'>)</mml:mo></mml:mrow><mml:mn>2</mml:mn></mml:msup></mml:mrow></mml:mfrac></mml:mrow></mml:math></disp-formula>
<p><italic>&#x302;</italic></p>
<p>Where <italic>y</italic> is the mean of the observed values. <italic>R</italic><sup><xref ref-type="bibr" rid="ref2">2</xref></sup> provides a measure of the goodness-of-fit, indicating how well the model explains the variation in the data. A higher <italic>R</italic><sup><xref ref-type="bibr" rid="ref2">2</xref></sup> value indicates a better model fit, though it does not always correlate with improved prediction accuracy, particularly in complex datasets (<xref ref-type="table" rid="T7">Table 7</xref>).</p>
<table-wrap id="T7">
<label>Table 7</label>
<caption><title>Comparison of performance metrics for energy load forecasting</title></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<th valign="top" align="left">Metric</th>
<th valign="top" align="left">Strengths</th>
<th valign="top" align="left">Weaknesses</th>
<th valign="top" align="left">Best Used For</th>
<th valign="top" align="left">Sensitivity to Outliers</th>
<th valign="top" align="left">References</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">MSE</td>
<td valign="top" align="left">Penalizes large errors, easy to compute</td>
<td valign="top" align="left">Sensitive to outliers, hard to interpret</td>
<td valign="top" align="left">Measuring overall error magnitude</td>
<td valign="top" align="left">High</td>
<td valign="top" align="left">37,38</td>
</tr>
<tr>
<td valign="top" align="left">RMSE</td>
<td valign="top" align="left">Intuitive, in original units of data</td>
<td valign="top" align="left">Sensitive to large errors</td>
<td valign="top" align="left">Performance comparison across models</td>
<td valign="top" align="left">High</td>
<td valign="top" align="left">39,40</td>
</tr>
<tr>
<td valign="top" align="left">MAE</td>
<td valign="top" align="left">Less sensitive to outliers</td>
<td valign="top" align="left">Does not penalize large errors enough</td>
<td valign="top" align="left">When outliers are not as critical</td>
<td valign="top" align="left">Low</td>
<td valign="top" align="left">38,39</td>
</tr>
<tr>
<td valign="top" align="left">MAPE</td>
<td valign="top" align="left">Easily interpretable, percentage-based</td>
<td valign="top" align="left">Issues with values close to zero</td>
<td valign="top" align="left">Comparing models across datasets</td>
<td valign="top" align="left">High</td>
<td valign="top" align="left">41,42</td>
</tr>
<tr>
<td valign="top" align="left"><italic>R</italic><sup><xref ref-type="bibr" rid="ref2">2</xref></sup></td>
<td valign="top" align="left">Indicates how well the model fits data</td>
<td valign="top" align="left">Does not guarantee prediction accuracy</td>
<td valign="top" align="left">Evaluating goodness-of-fit</td>
<td valign="top" align="left">Medium</td>
<td valign="top" align="left">43,44</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
</sec>
<sec id="sec004-2">
<title>Strengths and Limitations of Different ML Models</title>
<p>Typically, when choosing an ML model for energy load forecasting, one needs to evaluate the strengths and weaknesses of each model in terms of the nature of the energy load forecasting task. The performance may vary from model to model according to the complexity of the data available and the length of the forecasting horizon as well as the amount of historical data available.</p>
<sec id="sec004-2-1">
<title>Traditional ML Models</title>
<p>Popular traditional ML models include linear regression, DTs, SVMs, and RF which are always popular for their interpretability and ease of implementation. These models are best applicable for reasonably simple, short-term forecasting tasks with relatively simpler and easy-to-understand data. But they are not very useful with long-term dependencies or high nonlinearity in the process data. For instance,Hippert et al.<sup><xref ref-type="bibr" rid="ref45">45</xref></sup> and Wang et al.<sup><xref ref-type="bibr" rid="ref46">46</xref></sup> demonstrated the effectiveness of linear regression in short-term load forecasting due to its simplicity and speed. DTs, as shown by Liu et al.<sup><xref ref-type="bibr" rid="ref47">47</xref></sup> and, Singh et al.<sup><xref ref-type="bibr" rid="ref48">48</xref></sup> are useful for capturing nonlinear relationships in structured energy data. Meanwhile, RF have been proven robust in handling noisy data and enhancing forecasting accuracy, as shown in the works of Lahouar et al.<sup><xref ref-type="bibr" rid="ref49">49</xref></sup> and, Deb et al.<sup><xref ref-type="bibr" rid="ref50">50</xref></sup> particularly in short-term electricity demand forecasting (<xref ref-type="table" rid="T8">Table 8</xref>).</p>
<table-wrap id="T8">
<label>Table 8</label>
<caption><title>Comparison of traditional ML models for energy load forecasting</title></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<th valign="top" align="left">Model</th>
<th valign="top" align="left">Strengths</th>
<th valign="top" align="left">Limitations</th>
<th valign="top" align="left">Best Use Case</th>
<th valign="top" align="left">Computational Complexity</th>
<th valign="top" align="left">References</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Linear regression</td>
<td valign="top" align="left">Simple, interpretable</td>
<td valign="top" align="left">Limited to linear relationships</td>
<td valign="top" align="left">Baseline forecasting, short-term forecasts</td>
<td valign="top" align="left">Low</td>
<td valign="top" align="left">45,46</td>
</tr>
<tr>
<td valign="top" align="left">DT</td>
<td valign="top" align="left">Handles nonlinear relationships</td>
<td valign="top" align="left">Prone to overfitting, poor generalization</td>
<td valign="top" align="left">Small to medium-sized datasets</td>
<td valign="top" align="left">Medium</td>
<td valign="top" align="left">47,48</td>
</tr>
<tr>
<td valign="top" align="left">RF</td>
<td valign="top" align="left">Robust, reduces overfitting</td>
<td valign="top" align="left">Less interpretable, computationally intensive</td>
<td valign="top" align="left">Complex forecasting tasks</td>
<td valign="top" align="left">High</td>
<td valign="top" align="left">49,50</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="sec004-2-2">
<title>DL Models</title>
<p>Indeed, energy load forecasting is a good application for DL models, especially LSTM networks, GRU, and even ANN. These models are capable of capturing the time series and the nonlinear patterns within a large amount of data. This type of model is great in finding long-term trends and fine relationships between time series data, which are perfect for predicting purposes when historical consumption data is used as a fundamental in forecasting future energy demand.</p>
<p>LSTM and GRU are structures of rather diverse DL models, being parts of the RNN, which aims to deal more efficiently with sequential data compared to classic feed-forward networks, e.g., ANN. GRUs are known to be not as good as LSTMs at capturing long-term dependencies in time series data; however, GRUs are computationally lighter and more efficient at performing similar tasks as LSTMs. Several studies have validated this: Kuster et al.<sup><xref ref-type="bibr" rid="ref51">51</xref></sup> and Suganthi and Samuel<sup><xref ref-type="bibr" rid="ref52">52</xref></sup> demonstrated the utility of ANN in modeling complex energy consumption behaviors due to its flexibility and learning capabilities. LSTMs, as applied by Marino et al.<sup><xref ref-type="bibr" rid="ref53">53</xref></sup> and, Kong et al.<sup><xref ref-type="bibr" rid="ref54">54</xref></sup> have shown exceptional performance in capturing long-term dependencies in electricity demand prediction. Meanwhile, GRUs have been successfully employed by Liu et al.<sup><xref ref-type="bibr" rid="ref55">55</xref></sup> and, Liang et al.<sup><xref ref-type="bibr" rid="ref56">56</xref></sup> where they offered competitive accuracy with reduced computational overhead compared to LSTMs, making them suitable for real-time forecasting applications (<xref ref-type="table" rid="T9">Table 9</xref>).</p>
<table-wrap id="T9">
<label>Table 9</label>
<caption><title>Comparison of DL models for energy load forecasting</title></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<th valign="top" align="left">Model</th>
<th valign="top" align="left">Strengths</th>
<th valign="top" align="left">Limitations</th>
<th valign="top" align="left">Best Use Case</th>
<th valign="top" align="left">Computational Complexity</th>
<th valign="top" align="left">References</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">ANN</td>
<td valign="top" align="left">Captures nonlinear relationships, flexible</td>
<td valign="top" align="left">Needs large datasets, prone to overfitting</td>
<td valign="top" align="left">Medium-term forecasting, large datasets</td>
<td valign="top" align="left">High</td>
<td valign="top" align="left">51,52</td>
</tr>
<tr>
<td valign="top" align="left">LSTM</td>
<td valign="top" align="left">Long-term dependency handling, robust for time series</td>
<td valign="top" align="left">Computationally expensive, complex tuning</td>
<td valign="top" align="left">Long-term forecasting, capturing seasonality</td>
<td valign="top" align="left">Very High</td>
<td valign="top" align="left">53,54</td>
</tr>
<tr>
<td valign="top" align="left">GRU</td>
<td valign="top" align="left">Efficient, faster training, captures temporal dependencies</td>
<td valign="top" align="left">May not capture long-range dependencies as well as LSTM</td>
<td valign="top" align="left">Short to medium-term forecasting, large datasets</td>
<td valign="top" align="left">High</td>
<td valign="top" align="left">55,56</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="sec004-2-3">
<title>Ensemble Approaches</title>
<p>Ensemble methods like boosting (e.g., XGBoost) and bagging (e.g., RF) combine multiple models to improve forecasting accuracy and reduce variance. These methods are highly effective in energy load forecasting, particularly for datasets with noisy or fluctuating patterns. However, several researchers have demonstrated the effectiveness of these ensemble approaches. For boosting, Hong et al.<sup><xref ref-type="bibr" rid="ref57">57</xref></sup> applied gradient boosted regression trees (GBRTs) to improve short-term load forecasting accuracy in large-scale smart grid applications, while Taieb and Hyndman<sup><xref ref-type="bibr" rid="ref58">58</xref></sup> evaluated boosting strategies for probabilistic forecasting in energy systems. For bagging, Lahouar and Slama<sup><xref ref-type="bibr" rid="ref59">59</xref></sup> showed that RFs provided high accuracy and robustness in hourly electricity demand prediction and Zhou et al.<sup><xref ref-type="bibr" rid="ref60">60</xref></sup> confirmed their efficiency in handling feature-rich energy datasets and capturing nonlinear relationships (<xref ref-type="table" rid="T10">Table 10</xref>).</p>
<table-wrap id="T10">
<label>Table 10</label>
<caption><title>Comparison of ensemble approaches for energy load forecasting</title></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<th valign="top" align="left">Model</th>
<th valign="top" align="left">Strengths</th>
<th valign="top" align="left">Limitations</th>
<th valign="top" align="left">Best Use Case</th>
<th valign="top" align="left">Computational Complexity</th>
<th valign="top" align="left">References</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Boosting</td>
<td valign="top" align="left">Improves weak learners, high accuracy</td>
<td valign="top" align="left">Overfitting, sensitive to noisy data</td>
<td valign="top" align="left">Complex, noisy datasets, high-variance forecasting</td>
<td valign="top" align="left">High</td>
<td valign="top" align="left">57,58</td>
</tr>
<tr>
<td valign="top" align="left">Bagging</td>
<td valign="top" align="left">Reduces overfitting, stable</td>
<td valign="top" align="left">Less interpretable, computationally expensive</td>
<td valign="top" align="left">Large datasets, medium-term forecasting</td>
<td valign="top" align="left">Medium-High</td>
<td valign="top" align="left">59</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Selecting the right ML technique for energy load forecasting depends on the specific characteristics of the dataset and the forecasting horizon. While traditional models are efficient and easy to interpret, DL and ensemble approaches offer superior accuracy in complex scenarios. Performance metrics such as MSE, RMSE, MAE, and <italic>R</italic><sup><xref ref-type="bibr" rid="ref2">2</xref></sup> play a vital role in comparing and selecting the best model for a given task.</p>
</sec>
</sec>
</sec>
<sec id="sec005">
<title>Challenges and Future Directions</title>
<p>In smart grids, energy load forecasting is extremely important for effective energy distribution and real-time usage management. Despite advancements, several challenges remain unresolved, particularly those related to improving prediction accuracy, model scalability, and general applicability across diverse systems. These challenges not only hinder current progress but also highlight key directions for future research and innovation in this field (<xref ref-type="table" rid="T9">Table 9</xref>).</p>
<sec id="sec005-1">
<title>Data Availability and Quality Issues</title>
<p>The availability and quality of data are considered to be among the main issues in energy load forecasting. Most of the effectiveness of ML models lies in the richness and reliability of the dataset that they are trained on. Often, the energy load data is sparse, noisy, and incomplete, and hence it results in inaccurate prediction.<sup><xref ref-type="bibr" rid="ref61">61</xref></sup> Recovery Digital Data, a source for historically obsolete utility consumption data, is often ill-suited for the months and years before a system implemented this type of data. In addition, data from various sources might not be standardized, and thus, it becomes challenging to concatenate heterogeneous datasets to train predictive models.<sup><xref ref-type="bibr" rid="ref62">62</xref></sup></p>
<p>There is another important issue: the quality of data. Typically, energy load data contains missing values, outliers, and errors that can do a lot of harm to model performance. Although the data may always be available, it does not always mean it covers all the possible conditions that affect energy consumption, such as weather events, special holidays, or unusual spikes of demand.<sup><xref ref-type="bibr" rid="ref63">63</xref></sup> Further, data heterogeneity, or where different sources collect data in various formats at different scales and intervals, also creates an issue. All of these factors contribute to the difficulty in developing such generalizable, accurate models. In future research, these aspects should be improved concerning data acquisition, data format standardization, and robust data handling methods for missing and noisy data.<sup><xref ref-type="bibr" rid="ref64">64</xref></sup></p>
</sec>
<sec id="sec005-2">
<title>Computational Complexity and Model Interpretability</title>
<p>Energy load forecasting is another challenge and calls for computing complexity due to the usage of advanced ML models such as DL. Only with models like LSTMs networks and GRUs, we get good accuracy, but at a high cost of computation in terms of training and inference.<sup><xref ref-type="bibr" rid="ref65">65</xref></sup> Such models can be quite expensive in terms of processing power and time, as well as storage, in particular when large and high-dimensional sets of data are involved. Therefore, these models cannot be deployed in real time or on a vast scale, thus making them unfeasible for some utilities or organizations regarding the resources required and the cost associated with such deployment.<sup><xref ref-type="bibr" rid="ref66">66</xref></sup></p>
<p>In addition, DL models are also complex, and this constitutes a potential problem with model interpretability. Accurate prediction of energy consumption is not the only thing important in energy load forecasting; we also need to know why we predicted such things.<sup><xref ref-type="bibr" rid="ref67">67</xref></sup> Smart grids are particularly important given the need among stakeholders, grid operators, and regulators, as well as end users, to interpret how and why particular energy usage patterns are predicted. Often, such complex black box models, such as deep neural networks, cannot provide users with deep insight into factors that would either enable them to trust the predicted value or act on that particular prediction.<sup><xref ref-type="bibr" rid="ref68">68</xref></sup> Future research should aim to strike a balance between model complexity and interpretability, possibly through the integration of explainable artificial intelligence (XAI) techniques that can shed light on the decision-making process of these models without compromising their predictive power.<sup><xref ref-type="bibr" rid="ref69">69</xref></sup></p>
</sec>
<sec id="sec005-3">
<title>Potential Improvements and Emerging Trends</title>
<p>Despite them, there are some trends and potential for improving the effectiveness of energy load forecasting models. The area of incorporation of external factors is what is being proposed: weather conditions, socioeconomic factors, and real-time events. However, it turns out that these variables can have a major effect on energy demand without affecting forecasting models that rely heavily on historical load data.<sup><xref ref-type="bibr" rid="ref70">70</xref></sup> Introducing the real-time data from the sensors, weather forecasting models, and social media trends, ML models can come up with more accurate and timely predictions as they inherently consider both predictable and unpredictable events.</p>
<p>Furthermore, it is also important that attempts for the integration of hybrid models, those that combine the strength of multiple ML technologies, should also be moving forward. Hybrid approaches, such as combining DL models with traditional ML models like RF or SVMs, can help improve model accuracy and robustness by leveraging the strengths of each individual model.<sup><xref ref-type="bibr" rid="ref71">71</xref></sup> In other words, DL models are great at processing huge amounts of data with intricate interrelationships, while quaint models have increased ability to interpret and run faster on a computer. By joining the use of these approaches, researchers can yet develop more accurate, simple, and readable forecasting systems.<sup><xref ref-type="bibr" rid="ref72">72</xref></sup></p>
<p>Another promising direction is the application of federated learning, where ML models are trained across multiple decentralized devices or nodes without transferring raw data. This is useful for collaborative learning across regions or utility companies within the context of smart grids while maintaining the privacy of data and minimizing the storage to be centralized.<sup><xref ref-type="bibr" rid="ref73">73</xref></sup> Furthermore, in circumstances where data sharing is restricted due to regulatory limitations, federated learning could prove very useful.</p>
<p>Finally, another emerging trend is to incorporate RL techniques into energy load forecasting. This is because RL models can continuously learn and adapt to an environment that is changing, and that is precisely the case for dynamic, real-time forecasting scenarios.<sup><xref ref-type="bibr" rid="ref65">65</xref></sup> As energy consumption patterns change due to factors like economic shifts, population growth, or new energy policies, RL models could help adjust forecasting strategies on the fly, improving the accuracy of long-term predictions.</p>
</sec>
<sec id="sec005-4">
<title>Limitations in Benchmarking and Evaluation Practices</title>
<p>Another key challenge in energy load forecasting research lies in the inconsistency and limitations of benchmarking practices. A significant number of studies rely on private or domain-specific datasets, which limits the comparability of results across different models and research groups. This lack of standard publicly available datasets leads to fragmented progress and makes it difficult to reproduce results or validate the effectiveness of newly proposed methods.<sup><xref ref-type="bibr" rid="ref66">66</xref></sup> Moreover, the evaluation metrics used in various studies are not always uniform. While metrics like MAE, RMSE, and MAPE are common, their application without proper context&#x2014;such as normalization, peak-hour analysis, or seasonal decomposition&#x2014;can obscure the practical implications of model performance.<sup><xref ref-type="bibr" rid="ref74">74</xref></sup> Some studies also report results on short forecasting horizons only, ignoring the long-term performance stability of models. Therefore, there is a pressing need for the development of standardized benchmarking protocols, unified datasets, and comprehensive evaluation frameworks that consider multiple forecasting horizons, variable load types, and model robustness under different operational scenarios (<xref ref-type="table" rid="T11">Table 11</xref>).</p>
<table-wrap id="T11">
<label>Table 11</label>
<caption><title>Overview of key challenges and aligned future directions in energy load forecasting</title></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<th valign="top" align="left">Challenge</th>
<th valign="top" align="left">Description</th>
<th valign="top" align="left">Aligned Future Direction</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Data availability and quality</td>
<td valign="top" align="left">Incomplete, noisy, or nonstandardized datasets hinder model accuracy and generalizability</td>
<td valign="top" align="left">Data standardization, robust preprocessing, integration of real-time sources</td>
</tr>
<tr>
<td valign="top" align="left">Data heterogeneity</td>
<td valign="top" align="left">Varying formats, scales, and intervals from different sources make it hard to train unified models</td>
<td valign="top" align="left">Federated learning and unified data representation methods</td>
</tr>
<tr>
<td valign="top" align="left">Computational complexity</td>
<td valign="top" align="left">High computational cost for training and deployment, especially for DL models</td>
<td valign="top" align="left">Lightweight hybrid models, hardware-aware optimization</td>
</tr>
<tr>
<td valign="top" align="left">Model interpretability</td>
<td valign="top" align="left">Deep models act as black boxes, reducing trust and usability for decision-making</td>
<td valign="top" align="left">XAI integration, model simplification</td>
</tr>
<tr>
<td valign="top" align="left">Scalability across regions/systems</td>
<td valign="top" align="left">Models often trained on a small scale or local data may not generalize well</td>
<td valign="top" align="left">Federated learning, transfer learning</td>
</tr>
<tr>
<td valign="top" align="left">Forecasting under uncertainty</td>
<td valign="top" align="left">Limited adaptability to changing patterns due to events or policy shifts</td>
<td valign="top" align="left">RL, real-time adaptive models</td>
</tr>
<tr>
<td valign="top" align="left">Benchmarking and evaluation practices</td>
<td valign="top" align="left">Lack of standardized datasets and inconsistent use of evaluation metrics</td>
<td valign="top" align="left">Common benchmarking protocols, open-access repositories</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
</sec>
<sec id="sec006" sec-type="conclusions">
<title>Conclusion</title>
<p>Energy load forecasting is an important task to improve the energy distribution and to increase the operational efficiency of smart grids. It has been shown that a wide array of ML techniques can be effectively applied in order to boost the forecasting accuracy to a point where better decisions can be made by energy providers, while at the same time enhancing the pursuit of the sustainability goal of energy consumption efficiency. Different aspects of the forecasting task, for instance, the length of the forecast horizon, the complexity of the data and computational resources, show that traditional ML models, DL architectures like LSTMs and GRUs, and ensemble methods all have different benefits.</p>
<p>Yet, there are several challenges that have not yet been overcome in order to fully unleash these models&#x2019; potential. Nevertheless, despite these issues related to the data availability and quality, including sparse and noisy datasets, there has not been much progress in developing accurate and robust forecasting systems. As for the computational complexity of such models, especially of DL, which is quite advanced, it raises doubts about the possibility of their real-time implementation in a resource constrained environment. Furthermore, model interpretability is an open issue for the smart grid system stakeholders since the models need to explain and convince stakeholders of the predictions.</p>
<p>This study has several limitations. First, the review considered only peer-reviewed papers written in English, so relevant work published in other languages or in industry reports may have been missed. Second, most of the evidence is drawn from small-scale case studies focused on temperate-region grids, which may limit the generalizability of the findings to larger or more climate-diverse systems. Third, the analysis groups models by broad families rather than by specific architectural choices, which can hide finer factors that affect performance. Finally, the study does not quantify the economic impact of forecast errors, leaving the practical value of the reported accuracy gains open to further verification.</p>
</sec>
</body>
<back>
<fn-group>
<fn id="n1" fn-type="other">
<p>Additional material is published online only. To view please visit the journal online.</p>
<p><bold>Cite this as:</bold> Manzoor MF. Energy Load Forecasting with Machine Learning: Models, Metrics, and Future Directions. Premier Journal of Artificial Intelligence 2025;4:100018</p>
<p><bold>DOI:</bold> https://doi.org/10.70389/PJAI.100018</p>
</fn>
<fn id="n2" fn-type="other">
<p><bold>Ethical approval</bold></p>
<p>N/a</p>
</fn>
<fn id="n3" fn-type="other">
<p><bold>Consent</bold></p>
<p>N/a</p>
</fn>
<fn id="n4" fn-type="other">
<p><bold>Funding</bold></p>
<p>No industry funding</p>
</fn>
<fn id="n5" fn-type="conflict">
<p><bold>Conflicts of interest</bold></p>
<p>None</p>
</fn>
<fn id="n6" fn-type="other">
<p><bold>Author contribution</bold></p>
<p>Muhammad Faraz Manzoor &#x2013; Conceptualization, Writing &#x2013; original draft, review and editing</p>
</fn>
<fn id="n7" fn-type="other">
<p><bold>Guarantor</bold></p>
<p>Muhammad Faraz Manzoor</p>
</fn>
<fn id="n8" fn-type="other">
<p><bold>Provenance and peer-review</bold></p>
<p>Unsolicited and externally peer-reviewed</p>
</fn>
<fn id="n9" fn-type="other">
<p><bold>Data availability statement</bold></p>
<p>N/a</p>
</fn>
</fn-group>
<ref-list>
<title>References</title>
<ref id="ref1"><label>1</label><mixed-citation publication-type="journal"><string-name><surname>Cui</surname> <given-names>X</given-names></string-name>, <string-name><surname>Zhu</surname> <given-names>J</given-names></string-name>, <string-name><surname>Jia</surname> <given-names>L</given-names></string-name>, <string-name><surname>Wang</surname> <given-names>J</given-names></string-name>, <string-name><surname>Wu</surname> <given-names>Y</given-names></string-name>. <article-title>A novel heat load prediction model of district heating system based on hybrid whale optimization algorithm (WOA) and CNN-LSTM with attention mechanism</article-title>. <source>Energy</source>. <year>2024</year>;<volume>312</volume>:<issue>133536</issue>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.energy.2024.133536">https://doi.org/10.1016/j.energy.2024.133536</ext-link></mixed-citation></ref>
<ref id="ref2"><label>2</label><mixed-citation publication-type="journal"><string-name><surname>Shrestha</surname> <given-names>A</given-names></string-name>, <string-name><surname>Mahmood</surname> <given-names>A</given-names></string-name>. <article-title>Review of deep learning algorithms and architectures</article-title>. <source>IEEE Access</source>. <year>2019</year>;<volume>7</volume>:<fpage>53040</fpage>&#x2013;<lpage>65</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1109/ACCESS.2019.2912200">https://doi.org/10.1109/ACCESS.2019.2912200</ext-link></mixed-citation></ref>
<ref id="ref3"><label>3</label><mixed-citation publication-type="journal"><string-name><surname>Mekonnen</surname> <given-names>Y</given-names></string-name>, <string-name><surname>Namuduri</surname> <given-names>S</given-names></string-name>, <string-name><surname>Burton</surname> <given-names>L</given-names></string-name>, <string-name><surname>Sarwat</surname> <given-names>A</given-names></string-name>, <string-name><surname>Bhansali</surname> <given-names>S</given-names></string-name>. <article-title>Review&#x2014;machine learning techniques in wireless sensor network based precision agriculture</article-title>. <source>J Electrochem Soc</source>. <year>2020</year>;<volume>167</volume>(<issue>3</issue>):<fpage>037522</fpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1149/2.0222003JES">https://doi.org/10.1149/2.0222003JES</ext-link></mixed-citation></ref>
<ref id="ref4"><label>4</label><mixed-citation publication-type="journal"><string-name><surname>Agupugo</surname> <given-names>CP</given-names></string-name>, <string-name><surname>Ajayi</surname> <given-names>AO</given-names></string-name>, <string-name><surname>Nwanevu</surname> <given-names>C</given-names></string-name>, <string-name><surname>Oladipo</surname> <given-names>SS</given-names></string-name>. <article-title>Policy and regulatory framework supporting renewable energy microgrids and energy storage systems</article-title>. <source>Eng Sci Technol J</source>. <year>2024</year>;<volume>5</volume>(<issue>8</issue>):<fpage>2589</fpage>&#x2013;<lpage>615</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.51594/estj.v5i8.1460">https://doi.org/10.51594/estj.v5i8.1460</ext-link></mixed-citation></ref>
<ref id="ref5"><label>5</label><mixed-citation publication-type="journal"><string-name><surname>Nuthakki</surname> <given-names>S</given-names></string-name>, <string-name><surname>Kulkarni</surname> <given-names>CS</given-names></string-name>, <string-name><surname>Kathiriya</surname> <given-names>S</given-names></string-name>, <string-name><surname>Nuthakki</surname> <given-names>Y</given-names></string-name>. <article-title>Artificial intelligence applications in natural gas industry: a literature review</article-title>. <source>Int J Eng Adv Technol</source>. <year>2024</year>;<volume>13</volume>(<issue>3</issue>):<fpage>64</fpage>&#x2013;<lpage>70</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.35940/ijeat.c4383.13030224.">https://doi.org/10.35940/ijeat.c4383.13030224.</ext-link></mixed-citation></ref>
<ref id="ref6"><label>6</label><mixed-citation publication-type="journal"><string-name><surname>Nuthakki</surname> <given-names>S</given-names></string-name>, <string-name><surname>Buddiga</surname> <given-names>SKP</given-names></string-name>, <string-name><surname>Koganti</surname> <given-names>S</given-names></string-name>. <article-title>Exploring deep learning models for image recognition: a comparative review</article-title>. <source>Signal Image Process An Int J</source>. <year>2024</year>;<volume>15</volume>(<issue>3</issue>):<fpage>1</fpage>&#x2013;<lpage>10</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.5121/sipij.2024.15301">https://doi.org/10.5121/sipij.2024.15301</ext-link></mixed-citation></ref>
<ref id="ref7"><label>7</label><mixed-citation publication-type="journal"><string-name><surname>Patil</surname> <given-names>S</given-names></string-name>, <string-name><surname>Awan</surname> <given-names>KH</given-names></string-name>, <string-name><surname>Arakeri</surname> <given-names>G</given-names></string-name>, <string-name><surname>Seneviratne</surname> <given-names>CJ</given-names></string-name>, <string-name><surname>Muddur</surname> <given-names>N</given-names></string-name>, <string-name><surname>Malik</surname> <given-names>S</given-names></string-name>, <etal>et al.</etal> <article-title>Machine learning and its potential applications to the genomic study of head and neck cancer&#x2014;a systematic review</article-title>. <source>J Oral Pathol Med</source>. <year>2019</year>;<volume>48</volume>(<issue>9</issue>):<fpage>773</fpage>&#x2013;<lpage>79</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1111/jop.12854">https://doi.org/10.1111/jop.12854</ext-link></mixed-citation></ref>
<ref id="ref8"><label>8</label><mixed-citation publication-type="journal"><string-name><surname>Nallore</surname> <given-names>SS</given-names></string-name>, <string-name><surname>Velumani</surname> <given-names>A</given-names></string-name>, <string-name><surname>Reddimasu</surname> <given-names>V</given-names></string-name>. <article-title>Machine learning for early detection of neurodegenerative diseases</article-title>. <source>Int J Res Publ Rev</source>. <year>2023</year>;<volume>4</volume>(<issue>11</issue>):<fpage>1894</fpage>&#x2013;<lpage>909</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.55248/gengpi.4.1123.113123">https://doi.org/10.55248/gengpi.4.1123.113123</ext-link></mixed-citation></ref>
<ref id="ref9"><label>9</label><mixed-citation publication-type="journal"><string-name><surname>Gou</surname> <given-names>J</given-names></string-name>, <string-name><surname>Yu</surname> <given-names>B</given-names></string-name>, <string-name><surname>Maybank</surname> <given-names>SJ</given-names></string-name>, <string-name><surname>Tao</surname> <given-names>D</given-names></string-name>. <article-title>Knowledge distillation: a survey</article-title>. <source>Int J Comput Vis</source>. <year>2021</year>;<volume>129</volume>(<issue>6</issue>):<fpage>1789</fpage>&#x2013;<lpage>819</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1007/s11263-021-01453-z">https://doi.org/10.1007/s11263-021-01453-z</ext-link></mixed-citation></ref>
<ref id="ref10"><label>10</label><mixed-citation publication-type="journal"><string-name><surname>Manzoor</surname> <given-names>MF</given-names></string-name>, <string-name><surname>Farooq</surname> <given-names>MS</given-names></string-name>, <string-name><surname>Haseeb</surname> <given-names>M</given-names></string-name>, <string-name><surname>Farooq</surname> <given-names>U</given-names></string-name>, <string-name><surname>Khalid</surname> <given-names>S</given-names></string-name>, <string-name><surname>Abid</surname> <given-names>A</given-names></string-name>. <article-title>Exploring the landscape of intrinsic plagiarism detection: benchmarks, techniques, evolution, and challenges</article-title>. <source>IEEE Access</source>. <year>2023</year>;<volume>11</volume>:<fpage>140519</fpage>&#x2013;<lpage>45</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1109/ACCESS.2023.3338855">https://doi.org/10.1109/access.2023.3338855</ext-link></mixed-citation></ref>
<ref id="ref11"><label>11</label><mixed-citation publication-type="journal"><string-name><surname>Ishaq</surname> <given-names>M</given-names></string-name>, <string-name><surname>Abid</surname> <given-names>A</given-names></string-name>, <string-name><surname>Farooq</surname> <given-names>MS</given-names></string-name>, <string-name><surname>Manzoor</surname> <given-names>MF</given-names></string-name>, <string-name><surname>Farooq</surname> <given-names>U</given-names></string-name>, <string-name><surname>Abid</surname> <given-names>K</given-names></string-name>, <etal>et al.</etal> <article-title>Advances in database systems education: methods, tools, curricula, and way forward</article-title>. <source>Educ Inf Technol (Dordr)</source>. <year>2023</year>;<volume>28</volume>(<issue>3</issue>):<fpage>2681</fpage>&#x2013;<lpage>725</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1007/s10639-022-11293-0">https://doi.org/10.1007/s10639-022-11293-0</ext-link></mixed-citation></ref>
<ref id="ref12"><label>12</label><mixed-citation publication-type="journal"><string-name><surname>Dridi</surname> <given-names>S</given-names></string-name>, <string-name><surname>Machine</surname> <given-names>V</given-names></string-name>, <string-name><surname>Tree</surname> <given-names>D</given-names></string-name>, <string-name><surname>Forest</surname> <given-names>R</given-names></string-name>, <string-name><surname>Regression</surname> <given-names>L</given-names></string-name>. <article-title>S l - a s l r</article-title>; <year>2021</year>.</mixed-citation></ref>
<ref id="ref13"><label>13</label><mixed-citation publication-type="journal"><string-name><surname>Alzubaidi</surname> <given-names>L</given-names></string-name>, <string-name><surname>Zhang</surname> <given-names>J</given-names></string-name>, <string-name><surname>Humaidi</surname> <given-names>AJ</given-names></string-name>, <string-name><surname>Al-Dujaili</surname> <given-names>A</given-names></string-name>, <string-name><surname>Duan</surname> <given-names>Y</given-names></string-name>, <string-name><surname>Al-Shamma</surname> <given-names>O</given-names></string-name>, <etal>et al.</etal> <article-title>Review of deep learning: concepts, CNN architectures, challenges, applications, future directions</article-title>. <source>J Big Data</source>. <year>2021</year>;<volume>8</volume>:<issue>53</issue>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1186/s40537-021-00444-8">https://doi.org/10.1186/s40537-021-00444-8</ext-link></mixed-citation></ref>
<ref id="ref14"><label>14</label><mixed-citation publication-type="journal"><string-name><surname>Sarker</surname> <given-names>IH</given-names></string-name>. <article-title>Deep learning: a comprehensive overview on techniques, taxonomy, applications and research directions</article-title>. <source>SN Comput Sci</source>. <year>2021</year>;<volume>2</volume>(<issue>6</issue>):<fpage>1</fpage>&#x2013;<lpage>20</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1007/s42979-021-00815-1">https://doi.org/10.1007/s42979-021-00815-1</ext-link></mixed-citation></ref>
<ref id="ref15"><label>15</label><mixed-citation publication-type="journal"><string-name><surname>S&#x00F6;derberg</surname> <given-names>MJ</given-names></string-name>, <string-name><surname>Meurling</surname> <given-names>A</given-names></string-name>. <article-title>Feature selection in short-term load forecasting</article-title>. <source>DIVA</source>; <year>2019</year>.</mixed-citation></ref>
<ref id="ref16"><label>16</label><mixed-citation publication-type="journal"><string-name><surname>Lahouar</surname> <given-names>A</given-names></string-name>, <string-name><surname>Ben Hadj Slama</surname> <given-names>J</given-names></string-name>. <article-title>Random forests model for one day ahead load forecasting</article-title>. <source>IREC 2015 6th Sixth international renewable energy congress</source>; <year>2015</year>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1109/IREC.2015.7110975">https://doi.org/10.1109/IREC.2015.7110975</ext-link></mixed-citation></ref>
<ref id="ref17"><label>17</label><mixed-citation publication-type="journal"><string-name><surname>Sarker</surname> <given-names>MT</given-names></string-name>, <string-name><surname>Alam</surname> <given-names>MJ</given-names></string-name>, <string-name><surname>Ramasamy</surname> <given-names>G</given-names></string-name>, <string-name><surname>Uddin</surname> <given-names>MN</given-names></string-name>. <article-title>Energy demand forecasting of remote areas using linear regression and inverse matrix analysis</article-title>. <source>Int J Electr Comput Eng</source>. <year>2024</year>;<volume>14</volume>(<issue>1</issue>):<fpage>129</fpage>&#x2013;<lpage>39</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.11591/ijece.v14i1.pp129-139">https://doi.org/10.11591/ijece.v14i1.pp129-139</ext-link></mixed-citation></ref>
<ref id="ref18"><label>18</label><mixed-citation publication-type="journal"><string-name><surname>Mahmud</surname> <given-names>MA</given-names></string-name>. <article-title>Isolated area load forecasting using linear regression analysis: practical approach</article-title>. <source>Energy Power Eng</source>. <year>2011</year>;<volume>3</volume>(<issue>4</issue>):<fpage>547</fpage>&#x2013;<lpage>50</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.4236/epe.2011.34067">https://doi.org/10.4236/epe.2011.34067</ext-link></mixed-citation></ref>
<ref id="ref19"><label>19</label><mixed-citation publication-type="journal"><string-name><surname>Hambali</surname> <given-names>M</given-names></string-name>, <string-name><surname>Akinyemi</surname> <given-names>A</given-names></string-name>, <string-name><surname>Oladunjoye</surname> <given-names>J</given-names></string-name>, <string-name><surname>Yusuf</surname> <given-names>N</given-names></string-name>. <article-title>Electric power load forecast using decision tree algorithms</article-title>. <source>Comput Inf Syst Dev Informatics Allied Res J</source>. <year>2016</year>;<volume>7</volume>(<issue>4</issue>):<fpage>29</fpage>&#x2013;<lpage>42</lpage>.</mixed-citation></ref>
<ref id="ref20"><label>20</label><mixed-citation publication-type="journal"><string-name><surname>Jahan</surname> <given-names>IS</given-names></string-name>, <string-name><surname>Snasel</surname> <given-names>V</given-names></string-name>, <string-name><surname>Misak</surname> <given-names>S</given-names></string-name>. <article-title>Intelligent systems for power load forecasting: a study review</article-title>. <source>Energies</source>. <year>2020</year>;<volume>13</volume>(<issue>22</issue>):<fpage>1</fpage>&#x2013;<lpage>12</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3390/en13226105">https://doi.org/10.3390/en13226105</ext-link></mixed-citation></ref>
<ref id="ref21"><label>21</label><mixed-citation publication-type="journal"><string-name><surname>Tian</surname> <given-names>L</given-names></string-name>, <string-name><surname>Noore</surname> <given-names>A</given-names></string-name>. <article-title>A novel approach for short-term load forecasting using support vector machines</article-title>. <source>Int J Neural Syst</source>. <year>2004</year>;<volume>14</volume>(<issue>5</issue>):<fpage>329</fpage>&#x2013;<lpage>35</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1142/S0129065704002078">https://doi.org/10.1142/S0129065704002078</ext-link></mixed-citation></ref>
<ref id="ref22"><label>22</label><mixed-citation publication-type="journal"><string-name><surname>Li</surname> <given-names>EYY</given-names></string-name>, <string-name><surname>Fang</surname> <given-names>T</given-names></string-name>. <article-title>Study of support vector machines for short-term load forecasting</article-title>. <source>Proc. CSEE</source> <year>2003</year>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1142/9789812796769_0063">https://doi.org/10.1142/9789812796769_0063</ext-link></mixed-citation></ref>
<ref id="ref23"><label>23</label><mixed-citation publication-type="journal"><string-name><surname>Dudek</surname> <given-names>G</given-names></string-name>. <article-title>Short-term load forecasting using random forests</article-title>. <source>Adv Intell Syst Comput</source>. <year>2015</year>;<volume>323</volume>:<fpage>821</fpage>&#x2013;<lpage>28</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1007/978-3-319-11310-4_71">https://doi.org/10.1007/978-3-319-11310-4_71</ext-link></mixed-citation></ref>
<ref id="ref24"><label>24</label><mixed-citation publication-type="journal"><string-name><surname>Gao</surname> <given-names>J</given-names></string-name>, <string-name><surname>Wang</surname> <given-names>K</given-names></string-name>, <string-name><surname>Kang</surname> <given-names>X</given-names></string-name>, <string-name><surname>Li</surname> <given-names>H</given-names></string-name>, <string-name><surname>Chen</surname> <given-names>S</given-names></string-name>. <article-title>Ultra-short-term electricity load forecasting based on improved random forest algorithm</article-title>. <source>AIP Adv</source>. <year>2023</year>;<volume>13</volume>(<issue>6</issue>):<fpage>065208</fpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1063/5.0153550">https://doi.org/10.1063/5.0153550</ext-link></mixed-citation></ref>
<ref id="ref25"><label>25</label><mixed-citation publication-type="journal"><string-name><surname>Oreshkin</surname> <given-names>BN</given-names></string-name>, <string-name><surname>Dudek</surname> <given-names>G</given-names></string-name>, <string-name><surname>Pe&#x142;ka</surname> <given-names>P</given-names></string-name>, <string-name><surname>Turkina</surname> <given-names>E</given-names></string-name>. <article-title>N-BEATS neural network for mid-term electricity load forecasting</article-title>. <source>Appl Energy</source>. <year>2021</year>;<volume>293</volume>:<fpage>1</fpage>&#x2013;<lpage>33</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.apenergy.2021.116918.">https://doi.org/10.1016/j.apenergy.2021.116918.</ext-link></mixed-citation></ref>
<ref id="ref26"><label>26</label><mixed-citation publication-type="journal"><string-name><surname>Gao</surname> <given-names>R</given-names></string-name>, <string-name><surname>Du</surname> <given-names>L</given-names></string-name>, <string-name><surname>Suganthan</surname> <given-names>PN</given-names></string-name>, <string-name><surname>Zhou</surname> <given-names>Q</given-names></string-name>, <string-name><surname>Yuen</surname> <given-names>KF</given-names></string-name>. <article-title>Random vector functional link neural network based ensemble deep learning for short-term load forecasting</article-title>. <source>Expert Syst Appl</source>. <year>2022</year>;<volume>206</volume>:<fpage>1</fpage>&#x2013;<lpage>10</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.eswa.2022.117784">https://doi.org/10.1016/j.eswa.2022.117784</ext-link></mixed-citation></ref>
<ref id="ref27"><label>27</label><mixed-citation publication-type="journal"><string-name><surname>Bayram</surname> <given-names>F</given-names></string-name>, <string-name><surname>Aupke</surname> <given-names>P</given-names></string-name>, <string-name><surname>Ahmed</surname> <given-names>BS</given-names></string-name>, <string-name><surname>Kassler</surname> <given-names>A</given-names></string-name>, <string-name><surname>Theocharis</surname> <given-names>A</given-names></string-name>, <string-name><surname>Forsman</surname> <given-names>J</given-names></string-name>. <article-title>DA-LSTM: a dynamic drift-adaptive learning framework for interval load forecasting with LSTM networks</article-title>. <source>Eng Appl Artif Intell</source>. <year>2023</year>;<volume>123</volume>:<fpage>0</fpage>&#x2013;<lpage>3</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.engappai.2023.106480">https://doi.org/10.1016/j.engappai.2023.106480</ext-link></mixed-citation></ref>
<ref id="ref28"><label>28</label><mixed-citation publication-type="journal"><string-name><surname>Lu</surname> <given-names>N</given-names></string-name>, <string-name><surname>Ouyang</surname> <given-names>Q</given-names></string-name>, <string-name><surname>Li</surname> <given-names>Y</given-names></string-name>, <string-name><surname>Zou</surname> <given-names>C</given-names></string-name>. <article-title>Electrical load forecasting model using hybrid LSTM neural networks with online correction</article-title>. <source>arXiv:2403.03898</source>; <year>2024</year>:<fpage>1</fpage>&#x2013;<lpage>9</lpage>.</mixed-citation></ref>
<ref id="ref29"><label>29</label><mixed-citation publication-type="journal"><string-name><surname>Emshagin</surname> <given-names>S</given-names></string-name>, <string-name><surname>Halim</surname> <given-names>WK</given-names></string-name>, <string-name><surname>Kashef</surname> <given-names>R</given-names></string-name>. <article-title>Short-term prediction of household electricity consumption using customized LSTM and GRU models</article-title>. <source>arXiv:2212.08757</source>; <year>2022</year>:<fpage>11</fpage>&#x2013;<lpage>30</lpage>.</mixed-citation></ref>
<ref id="ref30"><label>30</label><mixed-citation publication-type="journal"><string-name><surname>Dong</surname> <given-names>M</given-names></string-name>, <string-name><surname>Grumbach</surname> <given-names>L</given-names></string-name>. <article-title>A hybrid distribution feeder long-term load forecasting method based on sequence prediction</article-title>. <source>IEEE Trans Smart Grid</source>. <year>2020</year>;<volume>11</volume>(<issue>1</issue>):<fpage>470</fpage>&#x2013;<lpage>82</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1109/TSG.2019.2924183">https://doi.org/10.1109/TSG.2019.2924183</ext-link></mixed-citation></ref>
<ref id="ref31"><label>31</label><mixed-citation publication-type="journal"><string-name><surname>Ding</surname> <given-names>Y</given-names></string-name>, <string-name><surname>Wu</surname> <given-names>D</given-names></string-name>, <string-name><surname>He</surname> <given-names>Y</given-names></string-name>, <string-name><surname>Luo</surname> <given-names>X</given-names></string-name>, <string-name><surname>Deng</surname> <given-names>S</given-names></string-name>. <article-title>Highly-accurate electricity load estimation via knowledge aggregation</article-title>. <source>arXiv:2212.13913</source>; <year>2022</year>:<fpage>1</fpage>&#x2013;<lpage>6</lpage>.</mixed-citation></ref>
<ref id="ref32"><label>32</label><mixed-citation publication-type="journal"><string-name><surname>Rubattu</surname> <given-names>N</given-names></string-name>, <string-name><surname>Maroni</surname> <given-names>G</given-names></string-name>, <string-name><surname>Corani</surname> <given-names>G</given-names></string-name>. <article-title>Electricity load and peak forecasting: feature engineering, probabilistic LightGBM and temporal hierarchies</article-title>. <source>Lect Notes Comput Sci (including Subser. Lect. Notes Artif. Intell. Lect. Notes Bioinformatics)</source>. <year>2023</year>;<volume>14343</volume>:<fpage>276</fpage>&#x2013;<lpage>92</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1007/978-3-031-49896-1_18">https://doi.org/10.1007/978-3-031-49896-1_18</ext-link></mixed-citation></ref>
<ref id="ref33"><label>33</label><mixed-citation publication-type="journal"><string-name><surname>Dube</surname> <given-names>R</given-names></string-name>, <string-name><surname>Gautam</surname> <given-names>N</given-names></string-name>, <string-name><surname>Banerjee</surname> <given-names>A</given-names></string-name>. <article-title>Learning for interval prediction of electricity demand: a cluster-based bootstrapping approach</article-title>. <source>arXiv:2309.01336</source>; <year>2023</year>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.2139/ssrn.4720434">https://doi.org/10.2139/ssrn.4720434</ext-link></mixed-citation></ref>
<ref id="ref34"><label>34</label><mixed-citation publication-type="journal"><string-name><surname>Olumba</surname> <given-names>WC</given-names></string-name>, <string-name><surname>Monday</surname> <given-names>HN</given-names></string-name>, <string-name><surname>Nneji</surname> <given-names>GU</given-names></string-name>, <string-name><surname>Agbonifo</surname> <given-names>D</given-names></string-name>, <string-name><surname>David</surname> <given-names>GM</given-names></string-name>, <string-name><surname>Umana</surname> <given-names>ES</given-names></string-name>, <etal>et al.</etal> <article-title>BaggingSHAP: a novel ensemble approach for high-accu- racy energy demand forecasting</article-title>. <year>2024</year>;<volume>198</volume>:<fpage>14</fpage>&#x2013;<lpage>28</lpage>.</mixed-citation></ref>
<ref id="ref35"><label>35</label><mixed-citation publication-type="journal"><string-name><surname>Zhang</surname> <given-names>C</given-names></string-name>, <string-name><surname>Peng</surname> <given-names>Y</given-names></string-name>, <string-name><surname>Chen</surname> <given-names>H</given-names></string-name>. <article-title>A hybrid model based on random forest and LSTM for short-term electricity load forecasting</article-title>. <source>IEEE Access</source>. <year>2020</year>;<volume>8</volume>:<fpage>119566</fpage>&#x2013;<lpage>76</lpage>.</mixed-citation></ref>
<ref id="ref36"><label>36</label><mixed-citation publication-type="journal"><string-name><surname>Ma</surname> <given-names>W</given-names></string-name>, <string-name><surname>Liu</surname> <given-names>X</given-names></string-name>, <string-name><surname>Wang</surname> <given-names>Y</given-names></string-name>, <string-name><surname>Zhao</surname> <given-names>Y</given-names></string-name>. <article-title>Hybrid model of random forest and LSTM for electricity load forecasting</article-title>. <source>Energy Rep</source>. <year>2021</year>;<volume>7</volume>:<fpage>196</fpage>&#x2013;<lpage>203</lpage>.</mixed-citation></ref>
<ref id="ref37"><label>37</label><mixed-citation publication-type="journal"><string-name><surname>Chai</surname> <given-names>T</given-names></string-name>, <string-name><surname>Draxler</surname> <given-names>RR</given-names></string-name>. <article-title>Root mean square error (RMSE) or mean absolute error (MAE)? Arguments against avoiding RMSE in the literature</article-title>. <source>Geosci Model Dev</source>. <year>2014</year>;<volume>7</volume>(<issue>3</issue>):<fpage>1247</fpage>&#x2013;<lpage>50</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.5194/gmd-7-1247-2014">https://doi.org/10.5194/gmd-7-1247-2014</ext-link></mixed-citation></ref>
<ref id="ref38"><label>38</label><mixed-citation publication-type="journal"><string-name><surname>Willmott</surname> <given-names>CJ</given-names></string-name>, <string-name><surname>Matsuura</surname> <given-names>K</given-names></string-name>. <article-title>Advantages of the mean absolute error (MAE) over the root mean square error (RMSE) in assessing average model performance</article-title>. <source>Clim Res</source>. <year>2005</year>;<volume>30</volume>(<issue>1</issue>):<fpage>79</fpage>&#x2013;<lpage>82</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3354/cr030079">https://doi.org/10.3354/cr030079</ext-link></mixed-citation></ref>
<ref id="ref39"><label>39</label><mixed-citation publication-type="journal"><string-name><surname>Hyndman</surname> <given-names>RJ</given-names></string-name>, <string-name><surname>Koehler</surname> <given-names>AB</given-names></string-name>. <article-title>Another look at measures of forecast accuracy</article-title>. <source>Int J Forecast</source>. <year>2005</year>;<volume>22</volume>:<fpage>679</fpage>&#x2013;<lpage>88</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.ijforecast.2006.03.001">https://doi.org/10.1016/j.ijforecast.2006.03.001</ext-link></mixed-citation></ref>
<ref id="ref40"><label>40</label><mixed-citation publication-type="journal"><string-name><surname>Hong</surname> <given-names>T</given-names></string-name>, <string-name><surname>Pinson</surname> <given-names>P</given-names></string-name>, <string-name><surname>Fan</surname> <given-names>S</given-names></string-name>. <article-title>Global energy forecasting competition 2012</article-title>. <source>Int J Forecast</source>. <year>2014</year>;<volume>30</volume>(<issue>2</issue>):<fpage>357</fpage>&#x2013;<lpage>63</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.ijforecast.2013.07.001">https://doi.org/10.1016/j.ijforecast.2013.07.001</ext-link></mixed-citation></ref>
<ref id="ref41"><label>41</label><mixed-citation publication-type="journal"><string-name><surname>Makridakis</surname> <given-names>S</given-names></string-name>. <article-title>The M3-competition: results, conclusions and implications</article-title>. <source>Int J Forecast</source>. <year>2000</year>;<volume>16</volume>:<fpage>451</fpage>&#x2013;<lpage>76</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/S0169-2070(00)00057-1">https://doi.org/10.1016/S0169-2070(00)00057-1</ext-link></mixed-citation></ref>
<ref id="ref42"><label>42</label><mixed-citation publication-type="journal"><string-name><surname>Evans</surname> <given-names>MG</given-names></string-name>. <article-title>On the asymmetry of g</article-title>. <source>Psychol Rep</source>. <year>1999</year>;<volume>85</volume>(<issue>3 Pt 2</issue>):<fpage>1059</fpage>&#x2013;<lpage>69</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.2466/pr0.1999.85.3f.1059">https://doi.org/10.2466/pr0.1999.85.3f.1059</ext-link></mixed-citation></ref>
<ref id="ref43"><label>43</label><mixed-citation publication-type="journal"><string-name><surname>Draper</surname> <given-names>NR</given-names></string-name>, <string-name><surname>Smith</surname> <given-names>H</given-names></string-name>. <article-title>Applied regression analysis</article-title>. <source>3rd edn</source>. <publisher-name>Wiley</publisher-name>; <year>1998</year>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1002/9781118625590">https://doi.org/10.1002/9781118625590</ext-link></mixed-citation></ref>
<ref id="ref44"><label>44</label><mixed-citation publication-type="journal"><string-name><surname>Alexander</surname> <given-names>C</given-names></string-name>. <article-title>Market models: a guide to financial data analysis</article-title>. <source>John Wiley Sons</source>; <year>2001</year>.</mixed-citation></ref>
<ref id="ref45"><label>45</label><mixed-citation publication-type="journal"><string-name><surname>Hippert</surname> <given-names>RC</given-names></string-name>, <string-name><surname>Pedreira</surname> <given-names>HS</given-names></string-name>, <string-name><surname>Souza</surname> <given-names>CE</given-names></string-name>. <article-title>Neural networks for short-term load forecasting: a review and evaluation</article-title>. <source>IEEE Trans Power Syst</source>. <year>2001</year>;<volume>16</volume>(<issue>1</issue>):<fpage>44</fpage>&#x2013;<lpage>55</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1007/978-3-031-39847-6_1">https://doi.org/10.1007/978-3-031-39847-6_1</ext-link></mixed-citation></ref>
<ref id="ref46"><label>46</label><mixed-citation publication-type="journal"><string-name><surname>Wang</surname> <given-names>C</given-names></string-name>, <string-name><surname>Qin</surname> <given-names>J</given-names></string-name>, <string-name><surname>Chen</surname> <given-names>Y</given-names></string-name>. <article-title>A short-term load forecasting model based on wavelet transform and a hybrid intelligent algorithm</article-title>. <source>Sustainability</source>. <year>2019</year>;<volume>11</volume>(<issue>3</issue>):<fpage>685</fpage>.</mixed-citation></ref>
<ref id="ref47"><label>47</label><mixed-citation publication-type="journal"><string-name><surname>Liu</surname> <given-names>J</given-names></string-name>, <string-name><surname>Sun</surname> <given-names>Y</given-names></string-name>, <string-name><surname>Wu</surname> <given-names>H</given-names></string-name>, <string-name><surname>Zhang</surname> <given-names>Z</given-names></string-name>. <article-title>A decision tree-based short-term load forecasting model for electricity markets</article-title>. <source>Energy</source>. <year>2017</year>;<volume>135</volume>:<fpage>739</fpage>&#x2013;<lpage>49</lpage>.</mixed-citation></ref>
<ref id="ref48"><label>48</label><mixed-citation publication-type="journal"><string-name><surname>Singh</surname> <given-names>V</given-names></string-name>, <string-name><surname>Pal</surname> <given-names>SP</given-names></string-name>, <string-name><surname>Sharma</surname> <given-names>R</given-names></string-name>. <article-title>A decision tree based energy forecasting model using smart meter data</article-title>. <source>Procedia Comput Sci</source>. <year>2020</year>;<volume>167</volume>:<fpage>2450</fpage>&#x2013;<lpage>59</lpage>.</mixed-citation></ref>
<ref id="ref49"><label>49</label><mixed-citation publication-type="journal"><string-name><surname>Lahouar</surname> <given-names>JBH</given-names></string-name>, <string-name><surname>Slama</surname> <given-names>A</given-names></string-name>. <article-title>Day-ahead load forecast using random forests and expert input selection</article-title>. <source>Energy Convers Manag</source>. <year>2015</year>;<volume>103</volume>:<fpage>1040</fpage>&#x2013;<lpage>51</lpage>.</mixed-citation></ref>
<ref id="ref50"><label>50</label><mixed-citation publication-type="journal"><string-name><surname>Deb</surname> <given-names>KW</given-names></string-name>, <string-name><surname>Zhang</surname> <given-names>C</given-names></string-name>, <string-name><surname>Yang</surname> <given-names>F</given-names></string-name>, <string-name><surname>Lee</surname> <given-names>J</given-names></string-name>, <string-name><surname>Shah</surname> <given-names>SE</given-names></string-name>. <article-title>A review on time series forecasting techniques for building energy consumption</article-title>. <source>Renew Sustain Energy Rev</source>. <year>2017</year>;<volume>74</volume>:<fpage>902</fpage>&#x2013;<lpage>24</lpage>.</mixed-citation></ref>
<ref id="ref51"><label>51</label><mixed-citation publication-type="journal"><string-name><surname>Kuster</surname> <given-names>C</given-names></string-name>, <string-name><surname>Rezgui</surname> <given-names>Y</given-names></string-name>, <string-name><surname>Mourshed</surname> <given-names>M</given-names></string-name>. <article-title>Electrical load forecasting models: a critical systematic review</article-title>. <source>Sustain Cities Soc</source>. <year>2017</year>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.scs.2017.08.009">https://doi.org/10.1016/j.scs.2017.08.009</ext-link></mixed-citation></ref>
<ref id="ref52"><label>52</label><mixed-citation publication-type="journal"><string-name><surname>Suganthi</surname> <given-names>L</given-names></string-name>, <string-name><surname>Samuel</surname> <given-names>AA</given-names></string-name>. <article-title>Energy models for demand forecasting&#x2014;a review</article-title>. <source>Renew Sustain Energy Rev</source>. <year>2012</year>;<volume>16</volume>:<fpage>1223</fpage>&#x2013;<lpage>40</lpage>.</mixed-citation></ref>
<ref id="ref53"><label>53</label><mixed-citation publication-type="journal"><string-name><surname>Marino</surname> <given-names>D</given-names></string-name>, <string-name><surname>Amarasinghe</surname> <given-names>K</given-names></string-name>, <string-name><surname>Manic</surname> <given-names>M</given-names></string-name>. <article-title>Building energy load forecasting using deep neural networks</article-title>. <source>IEEE IECON</source>; <year>2016</year>.</mixed-citation></ref>
<ref id="ref54"><label>54</label><mixed-citation publication-type="journal"><string-name><surname>Kong</surname> <given-names>W</given-names></string-name>, <string-name><surname>Dong</surname> <given-names>ZY</given-names></string-name>, <string-name><surname>Jia</surname> <given-names>Y</given-names></string-name>, <string-name><surname>Hill</surname> <given-names>DJ</given-names></string-name>, <string-name><surname>Xu</surname> <given-names>Y</given-names></string-name>, <string-name><surname>Zhang</surname> <given-names>Y</given-names></string-name>. <article-title>Short-term residential load forecasting based on LSTM recurrent neural network</article-title>. <source>IEEE Transactions on Smart Grid</source>; <year>2017</year>. p. <fpage>841</fpage>&#x2013;<lpage>51</lpage>.</mixed-citation></ref>
<ref id="ref55"><label>55</label><mixed-citation publication-type="journal"><string-name><surname>Liu</surname> <given-names>Y</given-names></string-name>, <string-name><surname>Zhang</surname> <given-names>Z</given-names></string-name>, <string-name><surname>Lin</surname> <given-names>X</given-names></string-name>, <string-name><surname>Zhang</surname> <given-names>Z</given-names></string-name>. <article-title>A hybrid model based on GRU for short-term load forecasting</article-title>. <source>Appl Sci</source>. <year>2021</year>.</mixed-citation></ref>
<ref id="ref56"><label>56</label><mixed-citation publication-type="journal"><string-name><surname>Liang</surname> <given-names>X</given-names></string-name>, <string-name><surname>Hu</surname> <given-names>Y</given-names></string-name>, <string-name><surname>Li</surname> <given-names>C</given-names></string-name>, <string-name><surname>Xie</surname> <given-names>Y</given-names></string-name>. <article-title>A novel GRU-based approach for energy load forecasting under multivariate temporal features</article-title>. <source>Energy</source>. <year>2022</year>.</mixed-citation></ref>
<ref id="ref57"><label>57</label><mixed-citation publication-type="journal"><string-name><surname>Hong</surname> <given-names>A</given-names></string-name>, <string-name><surname>Pinson</surname> <given-names>T</given-names></string-name>, <string-name><surname>Fan</surname> <given-names>S</given-names></string-name>, <string-name><surname>Zareipour</surname> <given-names>H</given-names></string-name>, <string-name><surname>Troccoli</surname> <given-names>P</given-names></string-name>. <article-title>Probabilistic energy forecasting: Global Energy Forecasting Competition 2014 and beyond</article-title>. <source>Int J Forecast</source>. <year>2016</year>;<volume>32</volume>:<fpage>896</fpage>&#x2013;<lpage>913</lpage>.</mixed-citation></ref>
<ref id="ref58"><label>58</label><mixed-citation publication-type="journal"><string-name><surname>Taieb</surname> <given-names>SB</given-names></string-name>, <string-name><surname>Hyndman</surname> <given-names>RJ</given-names></string-name>. <article-title>A gradient boosting approach to the Kaggle load forecasting competition</article-title>. <source>Int J Forecast</source>. <year>2014</year>.</mixed-citation></ref>
<ref id="ref59"><label>59</label><mixed-citation publication-type="journal"><string-name><surname>Lahouar</surname> <given-names>A</given-names></string-name>, <string-name><surname>Slama</surname> <given-names>JBH</given-names></string-name>. <article-title>Hourly forecasting of Tunisian electricity demand using random forest</article-title>. <source>Int J Electr Power Energy Syst</source>. <year>2015</year>.</mixed-citation></ref>
<ref id="ref60"><label>60</label><mixed-citation publication-type="journal"><string-name><surname>Zhou</surname> <given-names>K</given-names></string-name>, <string-name><surname>Yang</surname> <given-names>S</given-names></string-name>, <string-name><surname>Shen</surname> <given-names>C</given-names></string-name>. <article-title>A review of electric load classification in smart grid environment</article-title>. <source>Renew Sustain Energy Rev</source>. <year>2013</year>;<volume>24</volume>:<fpage>103</fpage>&#x2013;<lpage>10</lpage>.</mixed-citation></ref>
<ref id="ref61"><label>61</label><mixed-citation publication-type="journal"><string-name><surname>Tymoshenko</surname> <given-names>K</given-names></string-name>, <string-name><surname>Bonadiman</surname> <given-names>D</given-names></string-name>, <string-name><surname>Moschitti</surname> <given-names>A</given-names></string-name>. <article-title>Learning to rank non-factoid answers: comment selection in web forums</article-title>. <source>Int Conf Inf Knowl Manag Proc</source>. <year>2016</year>:<fpage>2049</fpage>&#x2013;<lpage>52</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1145/2983323.2983906">https://doi.org/10.1145/2983323.2983906</ext-link></mixed-citation></ref>
<ref id="ref62"><label>62</label><mixed-citation publication-type="journal"><collab>Wrembel</collab>. <article-title>Data integration revitalized: from data warehouse through data lake to data mesh</article-title>. <publisher-name>Springer</publisher-name>; <year>2023</year>.</mixed-citation></ref>
<ref id="ref63"><label>63</label><mixed-citation publication-type="journal"><string-name><surname>Kelechi</surname> <given-names>AH</given-names></string-name>, <string-name><surname>Alsharif</surname> <given-names>MH</given-names></string-name>, <string-name><surname>Okpe</surname> <given-names>J</given-names></string-name>, <string-name><surname>Ezra</surname> <given-names>PJ</given-names></string-name>, <string-name><surname>Iorshase</surname> <given-names>K</given-names></string-name>, <string-name><surname>Atayero</surname> <given-names>AA</given-names></string-name>, <etal>et al.</etal> <article-title>Artificial intelligence: an energy efficiency tool for enhanced high performance computing</article-title>. <source>Symmetry (Basel)</source>. <year>2020</year>;<volume>12</volume>(<issue>6</issue>):<fpage>1029</fpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3390/SYM12061029">https://doi.org/10.3390/SYM12061029</ext-link></mixed-citation></ref>
<ref id="ref64"><label>64</label><mixed-citation publication-type="journal"><string-name><surname>Brooks</surname> <given-names>C</given-names></string-name>, <string-name><surname>Thompson</surname> <given-names>C</given-names></string-name>. <article-title>Predictive modelling in teaching and learning</article-title>. <source>In: Handbook of learning analytics</source>; <year>2022</year>. p. <fpage>29</fpage>&#x2013;<lpage>37</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.18608/hla22.003">https://doi.org/10.18608/hla22.003</ext-link></mixed-citation></ref>
<ref id="ref65"><label>65</label><mixed-citation publication-type="journal"><string-name><surname>Shiri</surname> <given-names>FM</given-names></string-name>, <string-name><surname>Perumal</surname> <given-names>T</given-names></string-name>, <string-name><surname>Mustapha</surname> <given-names>N</given-names></string-name>, <string-name><surname>Mohamed</surname> <given-names>R</given-names></string-name>. <article-title>A comprehensive overview and comparative analysis on deep learning models: CNN, RNN, LSTM, GRU</article-title>. <source>arXiv:2305.17473</source>; <year>2023</year>.</mixed-citation></ref>
<ref id="ref66"><label>66</label><mixed-citation publication-type="journal"><string-name><surname>Gao</surname> <given-names>S</given-names></string-name>, <string-name><surname>Huang</surname> <given-names>Y</given-names></string-name>, <string-name><surname>Zhang</surname> <given-names>S</given-names></string-name>, <string-name><surname>Han</surname> <given-names>J</given-names></string-name>, <string-name><surname>Wang</surname> <given-names>G</given-names></string-name>. <article-title>Short-term runoff prediction with GRU and LSTM networks without requiring time step optimization during sample generation</article-title>. <source>J Hydrol</source>. <year>2020</year>;<volume>589</volume>:<issue>125188</issue>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.jhydrol.2020.125188">https://doi.org/10.1016/j.jhydrol.2020.125188</ext-link></mixed-citation></ref>
<ref id="ref67"><label>67</label><mixed-citation publication-type="journal"><string-name><surname>Bommasani</surname> <given-names>R</given-names></string-name>, <etal>et al.</etal> <article-title>Language models are unsupervised multitask learners</article-title>; <year>2021</year>.</mixed-citation></ref>
<ref id="ref68"><label>68</label><mixed-citation publication-type="journal"><string-name><surname>Van Houdt</surname> <given-names>G</given-names></string-name>, <string-name><surname>Mosquera</surname> <given-names>C</given-names></string-name>, <string-name><surname>N&#x00E1;poles</surname> <given-names>G</given-names></string-name>. <article-title>A review on the long short-term memory model</article-title>. <source>Artif Intell Rev</source>. <year>2020</year>;<volume>53</volume>(<issue>8</issue>):<fpage>5929</fpage>&#x2013;<lpage>55</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1007/s10462-020-09838-1">https://doi.org/10.1007/s10462-020-09838-1</ext-link></mixed-citation></ref>
<ref id="ref69"><label>69</label><mixed-citation publication-type="journal"><string-name><surname>Abdul-Jabbar</surname> <given-names>SS</given-names></string-name>, <string-name><surname>Farhan</surname> <given-names>AK</given-names></string-name>. <article-title>Data analytics and techniques</article-title>. <source>Aro Sci J Koya Univ</source>. <year>2022</year>;<volume>10</volume>(<issue>2</issue>):<fpage>45</fpage>&#x2013;<lpage>55</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.14500/aro.10975">https://doi.org/10.14500/aro.10975</ext-link></mixed-citation></ref>
<ref id="ref70"><label>70</label><mixed-citation publication-type="journal"><string-name><surname>Halverson</surname> <given-names>LR</given-names></string-name>, <string-name><surname>Graham</surname> <given-names>CR</given-names></string-name>, <string-name><surname>Spring</surname> <given-names>KJ</given-names></string-name>, <string-name><surname>Drysdale</surname> <given-names>JS</given-names></string-name>, <string-name><surname>Henrie</surname> <given-names>CR</given-names></string-name>. <article-title>A thematic analysis of the most highly cited scholarship in the first decade of blended learning research</article-title>. <source>Internet High Educ</source>. <year>2014</year>;<volume>20</volume>:<fpage>20</fpage>&#x2013;<lpage>34</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.iheduc.2013.09.004">https://doi.org/10.1016/j.iheduc.2013.09.004</ext-link></mixed-citation></ref>
<ref id="ref71"><label>71</label><mixed-citation publication-type="journal"><string-name><surname>Stas</surname> <given-names>M</given-names></string-name>, <string-name><surname>Van Orshoven</surname> <given-names>J</given-names></string-name>, <string-name><surname>Dong</surname> <given-names>Q</given-names></string-name>, <string-name><surname>Heremans</surname> <given-names>S</given-names></string-name>, <string-name><surname>Zhang</surname> <given-names>B</given-names></string-name>. <article-title>A comparison of machine learning algorithms for regional wheat yield prediction using NDVI time series of SPOT-VGT</article-title>. <source>2016 5th International Conference on Agro-Geoinformatics</source>; <year>2016</year>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1109/Agro-Geoinformatics.2016.7577625">https://doi.org/10.1109/Agro-Geoinformatics.2016.7577625</ext-link></mixed-citation></ref>
<ref id="ref72"><label>72</label><mixed-citation publication-type="journal"><string-name><surname>Mendoza-Bernal</surname> <given-names>J</given-names></string-name>, <string-name><surname>Gonz&#x00E1;lez-Vidal</surname> <given-names>A</given-names></string-name>, <string-name><surname>Skarmeta</surname> <given-names>AF</given-names></string-name>. <article-title>A convolutional neural network approach for image-based anomaly detection in smart agriculture</article-title>. <source>Expert Syst Appl</source>. <year>2024</year>;<volume>247</volume>:<issue>123210</issue>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.eswa.2024.123210">https://doi.org/10.1016/j.eswa.2024.123210</ext-link></mixed-citation></ref>
<ref id="ref73"><label>73</label><mixed-citation publication-type="journal"><string-name><surname>Kumar</surname> <given-names>V</given-names></string-name>, <string-name><surname>Grag</surname> <given-names>ML</given-names></string-name>. <article-title>Predictive analytics: a review of trends and techniques</article-title>. <source>Int J Comput Appl</source>. <year>2018</year>;<volume>182</volume>(<issue>1</issue>):<fpage>31</fpage>&#x2013;<lpage>7</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.5120/ijca2018917434">https://doi.org/10.5120/ijca2018917434</ext-link></mixed-citation></ref>
<ref id="ref74"><label>74</label><mixed-citation publication-type="journal"><string-name><surname>Cui</surname> <given-names>M</given-names></string-name>. <article-title>District heating load prediction algorithm based on bidirectional long short-term memory network model</article-title>. <source>Energy</source>. <year>2022</year>;<volume>254</volume>:<issue>124283</issue>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1016/j.energy.2022.124283">https://doi.org/10.1016/j.energy.2022.124283</ext-link></mixed-citation></ref>
</ref-list>
</back>
</article>
