<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.2 20190208//EN" "http://jats.nlm.nih.gov/publishing/1.2/JATS-journalpublishing1.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="1.2" xml:lang="en">
    <front>
        <journal-meta>
            <journal-id journal-id-type="pmc">F1000Research</journal-id>
            <journal-title-group>
                <journal-title>F1000Research</journal-title>
            </journal-title-group>
            <issn pub-type="epub">2046-1402</issn>
            <publisher>
                <publisher-name>F1000 Research Limited</publisher-name>
                <publisher-loc>London, UK</publisher-loc>
            </publisher>
        </journal-meta>
        <article-meta>
            <article-id pub-id-type="doi">10.12688/f1000research.169436.2</article-id>
            <article-categories>
                <subj-group subj-group-type="heading">
                    <subject>Research Article</subject>
                </subj-group>
                <subj-group>
                    <subject>Articles</subject>
                </subj-group>
            </article-categories>
            <title-group>
                <article-title>GBWOEM: A Gradient-Based Weight Optimization Model for Improved Predictive Accuracy in Healthcare</article-title>
                <fn-group content-type="pub-status">
                    <fn>
                        <p>[version 2; peer review: 1 approved, 2 approved with reservations]</p>
                    </fn>
                </fn-group>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Das</surname>
                        <given-names>Surajit</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Data Curation</role>
                    <role content-type="http://credit.niso.org/">Formal Analysis</role>
                    <role content-type="http://credit.niso.org/">Software</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Original Draft Preparation</role>
                    <xref ref-type="aff" rid="a1">1</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Nayak</surname>
                        <given-names>Samaleswari P.</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Resources</role>
                    <role content-type="http://credit.niso.org/">Supervision</role>
                    <role content-type="http://credit.niso.org/">Validation</role>
                    <xref ref-type="aff" rid="a2">2</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Sahoo</surname>
                        <given-names>Biswajit</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Conceptualization</role>
                    <role content-type="http://credit.niso.org/">Methodology</role>
                    <role content-type="http://credit.niso.org/">Project Administration</role>
                    <uri content-type="orcid">https://orcid.org/0000-0003-1355-3395</uri>
                    <xref ref-type="aff" rid="a1">1</xref>
                </contrib>
                <contrib contrib-type="author" corresp="yes">
                    <name>
                        <surname>Champati Rai</surname>
                        <given-names>Satyananda</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Funding Acquisition</role>
                    <role content-type="http://credit.niso.org/">Investigation</role>
                    <role content-type="http://credit.niso.org/">Visualization</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <uri content-type="orcid">https://orcid.org/0000-0002-4237-4591</uri>
                    <xref ref-type="corresp" rid="c1">a</xref>
                    <xref ref-type="aff" rid="a1">1</xref>
                </contrib>
                <aff id="a1">
                    <label>1</label>School of Computer Engineering, Kalinga Institute of Industrial Technology, Bhubaneswar, Odisha, 751024, India</aff>
                <aff id="a2">
                    <label>2</label>Department of Computer Science and Engineering, Silicon University, Bhubaneswar, Odisha, 751024, India</aff>
            </contrib-group>
            <author-notes>
                <corresp id="c1">
                    <label>a</label>
                    <email xlink:href="mailto:satya.raifcs@kiit.ac.in">satya.raifcs@kiit.ac.in</email>
                </corresp>
                <fn fn-type="conflict">
                    <p>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>27</day>
                <month>1</month>
                <year>2026</year>
            </pub-date>
            <pub-date pub-type="collection">
                <year>2025</year>
            </pub-date>
            <volume>14</volume>
            <elocation-id>1161</elocation-id>
            <history>
                <date date-type="accepted">
                    <day>22</day>
                    <month>1</month>
                    <year>2026</year>
                </date>
            </history>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2026 Das S et al.</copyright-statement>
                <copyright-year>2026</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access article distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <self-uri content-type="pdf" xlink:href="https://f1000research.com/articles/14-1161/pdf"/>
            <abstract>
                <sec>
                    <title>Background</title>
                    <p>The use of ensemble learning has been crucial for improving predictive accuracy in healthcare, especially with regard to critical diagnostic and classification problems. Ensemble models combine the strengths of multiple ML models and reduce the risk of misclassification, which is important in healthcare, where accurate predictions impact patient outcomes.</p>
                </sec>
                <sec>
                    <title>Methods</title>
                    <p>This study introduces the Gradient-Based Weight Optimized Ensemble Model (GBWOEM), an advanced ensemble technique that optimizes the weights of five base models: Decision Tree Classifier (DTC), Random Forest Classifier (RFC), Logistic Regression (LR), Multi-Layer Perceptron (MLP), and K-Nearest Neighbours (KNN), through optimizing the weights. Two variants, GBWOEM-R (random weight initialization) and GBWOEM-U (uniform weight initialization), were proposed and tested on five healthcare-related datasets: breast cancer, Pima Indians Diabetes Database, diabetic retinopathy debrecen, obesity level estimation based on physical condition and eating habits, and thyroid diseases.</p>
                </sec>
                <sec>
                    <title>Results</title>
                    <p>The test accuracy of the proposed models increased to 0.48-8.26% over the traditional ensemble models, such as Adaboost, Catboost, GradientBoost, LightGBM, and XGBoost. Performance metrics, including ROC-AUC analyses, confirmed the model&#x2019;s efficacy in handling imbalanced data, highlighting its potential for advancing predictive consistency in healthcare applications.</p>
                </sec>
                <sec>
                    <title>Conclusion</title>
                    <p>The GBWOEM model improves the predictive accuracy and offers a reliable solution for healthcare applications even when dealing with the imbalance data. This strategy has the potential to ensure patient outcomes and diagnostic consistency in healthcare settings.</p>
                </sec>
            </abstract>
            <kwd-group kwd-group-type="author">
                <kwd>Ensemble Learning</kwd>
                <kwd>Healthcare</kwd>
                <kwd>Weight Optimization</kwd>
                <kwd>GBWOEM</kwd>
                <kwd>Classification</kwd>
                <kwd>ROC Curve</kwd>
                <kwd>Machine Learning</kwd>
                <kwd>Predictive Accuracy</kwd>
                <kwd>AUC.</kwd>
            </kwd-group>
            <funding-group>
                <award-group id="fund-1" xlink:href="https://doi.org/10.13039/501100020612">
                    <funding-source>Kalinga Institute of Industrial Technology</funding-source>
                </award-group>
                <funding-statement>The author(s) declared that no grants were involved in supporting this work.</funding-statement>
            </funding-group>
        </article-meta>
        <notes>
            <sec sec-type="version-changes">
                <label>Revised</label>
                <title>Amendments from Version 1</title>
                <p>The manuscript has been modified in response to the reviewers' helpful comments concerning model interpretability, data accuracy, and generalizability. For interpretation ease, we expanded the Results part to numerically demonstrate how the induced weights are controlling the contribution of each base model on top, with updated figures showing comparisons of our method against Random and Uniform weights strategies. With respect to data processing, we have explained our approach to support the use of natural data distributions and proven that the proposed model is capable of learning minority class borders without synthetic oversampling. We additionally introduced a full Train-vs-Test analysis to confirm the high AUC values and exclude overfitting; see new statement in Results section: `the agreement between training-test metrics supports that the model is robust to new data'.</p>
            </sec>
        </notes>
    </front>
    <body>
        <sec id="sec5" sec-type="intro">
            <title>Introduction</title>
            <p>In recent times, the use of ML in healthcare has gained enormous popularity owing to the increasing need for high-quality, timely, and efficient predictions, which are necessary for reliable diagnosis as well as assisting patients and physicians in treatment planning. Given that healthcare is intrinsically steeped in complex, high-stakes decision-making processes, this prediction errors can be catastrophic to patient care. This has led to the need to develop machine learning models that are not only accurate in prediction, but also transparent, generalizable across broad patient populations and practice settings, and robust against small errors in input features. Ensemble learning is a powerful approach among ML methodologies. Ensemble learning improves the overall performance of the system by combining multiple base models to create a single model that strengthens each other while covering their individual.
                <sup>
                    <xref ref-type="bibr" rid="ref1">1</xref>
                </sup> This model aggregation decreases the variance and reduces bias and overfitting. This is particularly important when using healthcare datasets because they are often complex, that is, high-dimensional, noisy, imbalanced, or even insufficient. Therefore, there is an abundance of healthcare applications where ensemble learning has been applied successfully, such as disease prediction, medical image analysis, and patient outcome forecasting.
                <sup>
                    <xref ref-type="bibr" rid="ref2">2</xref>,
                    <xref ref-type="bibr" rid="ref3">3</xref>
                </sup>
            </p>
            <p>Recently, ensemble methods, such as Bagging,
                <sup>
                    <xref ref-type="bibr" rid="ref4">4</xref>
                </sup> Boosting
                <sup>
                    <xref ref-type="bibr" rid="ref5">5</xref>
                </sup> and Stacking,
                <sup>
                    <xref ref-type="bibr" rid="ref6">6</xref>
                </sup> have been the focus of many predictive systems because they promise state-of-the-art performance in many domains. The most obvious bagging technique is the Random Forest, which boosts the stability and accuracy of models by training many weak learners independently and then combining their predictions. Boosting algorithms such as Adaboost, GradientBoost, XGBoost, and Catboost adjust the weights for the current model in some ways and continue throughout the predictions to correct any errors, which improves the accuracy of the overall ensemble. Instead, stacking trains is a metamodel that uses predictions from various base models, which usually results in more sophisticated predictions. When applied in healthcare, they have shown important results, allowing researchers and clinicians to develop models that can more accurately predict disease onset, severity, and treatment effectiveness.</p>
            <p>However, there is scope for improvement in tuning the contribution of each base model to the ensemble. Traditional approaches tend to treat all base models equally or correct model weights using ad-hoc rules. The shrugging of singular complexities existing in healthcare data has, understandably, failed for most. In healthcare applications, an imbalanced dataset is a common issue where the data only have a few positive classes, and if not handled properly, one will come out with a model that has bias. Furthermore, the heterogeneity of healthcare datasets, where feature spaces and data distributions vary widely, presents a significant challenge for traditional ensemble methods.
                <sup>
                    <xref ref-type="bibr" rid="ref7">7</xref>,
                    <xref ref-type="bibr" rid="ref8">8</xref>
                </sup>
            </p>
            <p>To address these challenges, we propose a novel Gradient-Based Weight Optimized Ensemble Model (GBWOEM), which is a self-adjusting ensemble learning model in which the weights of individual base models are dynamically assigned and updated via gradient-based optimization. This method assigns more weight to models that make better predictions and reduces the impact of weaker models to improve the overall performance of the ensemble. The sensitivity of the model is extremely high, which enables the minority class to be predicted more accurately. In our empirical evaluation, two major variants of the model were considered, GBWOEM-R and GBWOEM-U, to study and present a performance comparison with existing models. The key contributions of this study are as follows:
                <list list-type="bullet">
                    <list-item>
                        <label>&#x2022;</label>
                        <p>Developed the Gradient-Based Weight Optimized Ensemble Model (GBWOEM) with two different weight initialization strategies (GBWOEM-R and GBWOEM-U), a novel way to optimize the base model&#x2019;s weights in an ensemble dynamically.</p>
                    </list-item>
                    <list-item>
                        <label>&#x2022;</label>
                        <p>Introduced a log-based loss function with a small constant &#x03b5; to ensure numerical stability and refine the model&#x2019;s performance on imbalanced datasets.</p>
                    </list-item>
                    <list-item>
                        <label>&#x2022;</label>
                        <p>Experiments were conducted on five diverse datasets from the healthcare field, showing that the proposed GBWOEM consistently outperforms popular ensemble models such as Adaboost, Catboost, XGBoost, LightGBM and Gradient Boosting across all cases.</p>
                    </list-item>
                    <list-item>
                        <label>&#x2022;</label>
                        <p>Proved to is robust and adaptable to varying data contexts that show improvements in test accuracy for each of the datasets, ranging from 0.48% to 8.26%.</p>
                    </list-item>
                    <list-item>
                        <label>&#x2022;</label>
                        <p>We evaluated the relative weights assigned to individual base models in ensemble combinations, giving us useful information about what each contributing base model was doing with respect to the final prediction.</p>
                    </list-item>
                </list>
            </p>
        </sec>
        <sec id="sec6">
            <title>Related work</title>
            <p>Several studies have demonstrated that ensemble models are effective in a range of medical classification tasks. In a study by Younas et al.
                <sup>
                    <xref ref-type="bibr" rid="ref8">8</xref>
                </sup> used a weighted average ensemble technique combining GoogleNet and ResNet-50 to classify colorectal polyps using an augmented dataset (Gastrointestinal Lesions in Regular Colonoscopy and PICCOLO). Their ensemble model outperformed the base models and some other CNN-based deep neural networks, such as Inception-v3, Xception, DenseNet-20, and SqueezeNet. Bhuiyan and Islam
                <sup>
                    <xref ref-type="bibr" rid="ref9">9</xref>
                </sup> used weighted average and maximum voting ensemble techniques to ensemble VGG16, VGG19, and DenseNet201 for malaria classification from red blood cell images. The authors achieved improved performance over weight-based ensemble models and different CNN-ML classifiers. Marques et al.
                <sup>
                    <xref ref-type="bibr" rid="ref10">10</xref>
                </sup> proposed a cross-validation-based ensemble model using EfficientNetB0, averaging predictions across folds, for malaria detection, and achieved superior results compared to other researchers. Ali et al.
                <sup>
                    <xref ref-type="bibr" rid="ref11">11</xref>
                </sup> proposed a bagging-based ensemble model using a DNN to predict problems in the heart. The results of different networks are combined using Logit Boost, which achieves a better performance than Support Vector Machine (SVM), Logistic Regression (LR), Multi-Layer Perceptron (MLP), Random Forest Classifier (RFC), etc. Dutta et al.
                <sup>
                    <xref ref-type="bibr" rid="ref12">12</xref>
                </sup> introduced a weighted average-based ensemble with models such as Gaussian Na&#x00ef;ve Base (GNB), Decision Tree (DT), XGBoost (XGB), Random Forest (RF), and LightGBM (LGB) for early diabetes prediction, although with limited accuracy.</p>
            <p>The boosting-based ensemble model id proposed by Ihnaini et al.
                <sup>
                    <xref ref-type="bibr" rid="ref13">13</xref>
                </sup> to predict diabetes, where trees were used as weak learners, outperforming LR, NB, RF, K-Nearest Neighbour (KNN), DT, and SVM. Reddy et al.
                <sup>
                    <xref ref-type="bibr" rid="ref14">14</xref>
                </sup> used a voting-based ensemble model by combining LR, KNN, RF, DT, and AdaBoost with voting for diabetic retinopathy classification, which outperformed the base models. Habib and Tasnim
                <sup>
                    <xref ref-type="bibr" rid="ref15">15</xref>
                </sup> used the hard voting technique to form an ensemble model by combining LR, NB, RF, and MLP to classify cardiovascular diseases and outperformed the base models. For brain tumor classification, Al Amin et al.
                <sup>
                    <xref ref-type="bibr" rid="ref16">16</xref>
                </sup> used majority voting over ResNet-50, DenseNet121, InceptionV3, VGG19, and VGG16 for brain tumor classification, achieving a higher validation accuracy. El-Sappagh et al.
                <sup>
                    <xref ref-type="bibr" rid="ref17">17</xref>
                </sup> used different ensemble strategies such as majority voting, weighted majority voting, and stacking on the top of different base models such as SVM, MLP, RF, DT, KNN, LR, and XGB for Alzheimer&#x2019;s disease classification, concluding that stacking with XGBoost is most effective. De Souza et al.
                <sup>
                    <xref ref-type="bibr" rid="ref18">18</xref>
                </sup> applied stacking with CNN, LSTM, and CNN-LSTM to anxiety classification. For tuberculosis classification, Osamor and Okezie
                <sup>
                    <xref ref-type="bibr" rid="ref19">19</xref>
                </sup> used a weighted voting ensemble with NB and SVM with PCA and RFE-CV feature selection, achieving notable accuracy despite its simplicity.</p>
            <p>Using a federated learning-based setup, Subashchandrabose et al.
                <sup>
                    <xref ref-type="bibr" rid="ref20">20</xref>
                </sup> proposed a decentralized ensemble model for lung cancer classification and compared its performance with other ML models in both centralized and decentralized architectures, concluding that the proposed model works better in decentralized architecture. Abbas et al.
                <sup>
                    <xref ref-type="bibr" rid="ref21">21</xref>
                </sup> improved lung cancer classification using a weighted federated ensemble, optimizing the weight of the client&#x2019;s ANN using the Levenberg&#x2212; Marquardt and Bayesian regularization techniques, and their weighted sum was used in the server model for the final classification. Kotei and Thirunavukarasu
                <sup>
                    <xref ref-type="bibr" rid="ref22">22</xref>
                </sup> proposed a stacking-based ensemble of nine pre-trained CNN for tuberculosis classification. Despite its high accuracy, the model size and resource utilization are significant. Regarding diabetes classification, Prakash et al.
                <sup>
                    <xref ref-type="bibr" rid="ref23">23</xref>
                </sup> used hard voting with an ANN, RNN, DBN, Perceptron, and RDF, finding it better than Bagging, Boosting, and Stacking. EL-Rashidy et al.
                <sup>
                    <xref ref-type="bibr" rid="ref24">24</xref>
                </sup> proposed a stacking-based ensemble for the classification of mortality using KNN, MLP, LDA, DT, and LR, and stacked them using LR as a meta-learner, showing better results for other ensembles.</p>
            <p>For Covid-19 classification based on Chest X-ray images, Rajaraman et al.
                <sup>
                    <xref ref-type="bibr" rid="ref25">25</xref>
                </sup> proposed an ensemble model using CNN and ImageNet and found that the weighted average is the most efficient. For TB classification Rajaraman and Antani
                <sup>
                    <xref ref-type="bibr" rid="ref26">26</xref>
                </sup> proposed a CNN-based stacking ensemble using pre-trained models, such as Inception-v3, CNN, VGG-16, InceptionReseNet-V2, Xception, and Densenet-121. The model achieved good accuracy at the cost of an increased model size. Juraev et al.
                <sup>
                    <xref ref-type="bibr" rid="ref27">27</xref>
                </sup> accessed different static and dynamic ensemble strategies and concluded that the DESKNN strategy yielded the best results when classic ML models were used as the base models. Anand et al.
                <sup>
                    <xref ref-type="bibr" rid="ref28">28</xref>
                </sup> used a weighted average-based ensemble for the classification of brain tumors using VGG19 and variants of CNN, initializing weights using grid search and achieving better performance than base models.</p>
            <p>Through the survey shown in 
                <xref ref-type="table" rid="T1">
Table 1</xref>, a significant difference in the usage of base models based on the type of data was observed. Researchers have mostly used statistical or other traditional models as base models when working with tabular data, where the data are arranged in rows and columns, such as medical records or diagnostic metrics, whereas CNNs are typically employed as base models for image datasets. The use of CNN-based models results in an increase in the complexity and computational footprint compared with other ensemble models. A range of ensemble techniques, such as averaging, aggregation, weighted averaging, voting, weighted voting, boosting, and bagging, have been used to integrate the results of diverse base models. Of all the mentioned techniques, weighted averaging is one of the most commonly used techniques for combining results owing to its effectiveness in improving ensemble performance.</p>
            <table-wrap id="T1" orientation="portrait" position="float">
                <label>
Table 1. </label>
                <caption>
                    <title>Literature review.</title>
                </caption>
                <table content-type="article-table" frame="hsides">
                    <thead>
                        <tr>
                            <th align="left" colspan="1" rowspan="1" valign="top">Author</th>
                            <th align="left" colspan="1" rowspan="1" valign="top">Disease</th>
                            <th align="left" colspan="1" rowspan="1" valign="top">Models</th>
                            <th align="left" colspan="1" rowspan="1" valign="top">Ensemble technique</th>
                            <th align="left" colspan="1" rowspan="1" valign="top">Accuracy</th>
                            <th align="left" colspan="1" rowspan="1" valign="top">Observation</th>
                        </tr>
                    </thead>
                    <tbody>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">Dutta et al.
                                <sup>
                                    <xref ref-type="bibr" rid="ref12">12</xref>
                                </sup>
                            </td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Diabetes</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">GNB, BNB, RF, DT, XGB, LGB</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Weighted Average</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">73.5</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">The AUC of the base models is taken as weight.</td>
                        </tr>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">Amin et al.
                                <sup>
                                    <xref ref-type="bibr" rid="ref16">16</xref>
                                </sup>
                            </td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Brain Tumor</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">ResNet-50, DenseNet121, InceptionV3, VGG19, VGG16</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Voting</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">98</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Proposed model outperforms base models.</td>
                        </tr>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">Habib and Tasnim
                                <sup>
                                    <xref ref-type="bibr" rid="ref15">15</xref>
                                </sup>
                            </td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Cardio vascular Disease</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">LR, GNB, RF, MLP</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Voting</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">88.42</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Proposed model outperforms base models.</td>
                        </tr>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">Baha et al.
                                <sup>
                                    <xref ref-type="bibr" rid="ref13">13</xref>
                                </sup>
                            </td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Diabetes</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Trees</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Boosting</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">99.6</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Proposed ensemble outperforms existing ML models.</td>
                        </tr>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">Kotei and Thirunavukarasu
                                <sup>
                                    <xref ref-type="bibr" rid="ref22">22</xref>
                                </sup>
                            </td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Tuber-culosis
</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">VGG16, VGG19, InceptionV2, MobileNet, Xception, Densenet, EfficientNEtB1, Resnet50, InceptionV3, CNN</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Stacking</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">98.38</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Too many CNN-based models increase the complexity and computational footprint.</td>
                        </tr>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">Younas et al.
                                <sup>
                                    <xref ref-type="bibr" rid="ref8">8</xref>
                                </sup>
                            </td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Colorectal Cancer</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">GoogleNet, ResNet-50</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Weighted Average</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">96.3</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Grid search is used for weight initialization.</td>
                        </tr>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">Ali et al.
                                <sup>
                                    <xref ref-type="bibr" rid="ref11">11</xref>
                                </sup>
                            </td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Heart Disease</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">DNN, LogitBoost</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Weighted Average</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">98.5</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">All the experimental models gave their respective highest accuracy at the same feature count.</td>
                        </tr>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">Juraev et al.
                                <sup>
                                    <xref ref-type="bibr" rid="ref27">27</xref>
                                </sup>
                            </td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Mortality</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">DT, LR, Linear SVR, KNN, Lidge, Lasso, CB, XGB, RF, GB, LGBM</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Voting</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">98.7</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Traditional ensemble models as base model reduces the model gives better performance.</td>
                        </tr>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">Reddy et al.
                                <sup>
                                    <xref ref-type="bibr" rid="ref14">14</xref>
                                </sup>
                            </td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Diabetic Retinopathy</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">LR, DT, KNN, RF, Adaboost</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Voting</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">82</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Proposed model outperforms base models.</td>
                        </tr>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">Marques et al.
                                <sup>
                                    <xref ref-type="bibr" rid="ref10">10</xref>
                                </sup>
                            </td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Malaria</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">EfficientNetB0</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Averaging</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">98.29</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Average of 10-fold cross-validation is used.</td>
                        </tr>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">Bhuiyan and Islam
                                <sup>
                                    <xref ref-type="bibr" rid="ref9">9</xref>
                                </sup>
                            </td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Malaria</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">VGG16, VGG19, DenseNet201</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Weighted Average, Max Voting</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">97.92</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Proposed model outperforms base models.</td>
                        </tr>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">EL-Rashidy et al.
                                <sup>
                                    <xref ref-type="bibr" rid="ref24">24</xref>
                                </sup>
                            </td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Mortality</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">KNN, MLP, LDA, DT, LR</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Stacking</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">94.4</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Performs better than existing ensembles.</td>
                        </tr>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">Prakash et al.
                                <sup>
                                    <xref ref-type="bibr" rid="ref23">23</xref>
                                </sup>
                            </td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Diabetes</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">ANN, RNN, DBN, Perceptron, RDF</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Voting</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">92</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Voting is giving better results than the other ensemble techniques.</td>
                        </tr>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">Abbas et al.
                                <sup>
                                    <xref ref-type="bibr" rid="ref21">21</xref>
                                </sup>
                            </td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Lung Cancer</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">ANN</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Weighted Sum</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">96.3</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Model works better only in distributed system.</td>
                        </tr>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">Shaker et al.
                                <sup>
                                    <xref ref-type="bibr" rid="ref17">17</xref>
                                </sup>
                            </td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Alzheimer&#x2019;s disease</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">SVM, MLP, RF, DT, KNN, LR, XGB</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Majority voting, Weighted majority voting, stacking</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">89.15</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Stacking with XGB performs better than the other setups.</td>
                        </tr>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">Rajaraman and Antani
                                <sup>
                                    <xref ref-type="bibr" rid="ref26">26</xref>
                                </sup>
                            </td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Tuber-culosis
</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Xception, Densenet-121, CNN, VGG-16, Inception-v3, InceptionReseNet-V2</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Stacking</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">94.1</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">So many pre-trained models increase the computational footprint.</td>
                        </tr>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">Rajaraman et al.
                                <sup>
                                    <xref ref-type="bibr" rid="ref25">25</xref>
                                </sup>
                            </td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Covid-19</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">CNN, ImageNet</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Weighted Average</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">99.01</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Weighted average with pruned CNN model performs better.</td>
                        </tr>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">Subashchandrabose et al.
                                <sup>
                                    <xref ref-type="bibr" rid="ref20">20</xref>
                                </sup>
                            </td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Lung Cancer</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">NN</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">-</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">89.63</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">The centralized approach gave a better result than the decentralized approach.</td>
                        </tr>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">Souza et al.
                                <sup>
                                    <xref ref-type="bibr" rid="ref18">18</xref>
                                </sup>
                            </td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Anxiety</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">CNN, LSTM</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Stacking</td>
                            <td colspan="1" rowspan="1"/>
                            <td align="left" colspan="1" rowspan="1" valign="top">A blend of CNN, LSTM, and CNN-LSTM with stacking gave less error than others.</td>
                        </tr>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">Anand et al.
                                <sup>
                                    <xref ref-type="bibr" rid="ref28">28</xref>
                                </sup>
                            </td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Brain Tumor</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">VGG19, CNN</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Weighted Average</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">98</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Grid search is used for weight initialization.</td>
                        </tr>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">Osamor and Okezie
                                <sup>
                                    <xref ref-type="bibr" rid="ref19">19</xref>
                                </sup>
                            </td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Tuber-culosis
</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">NB, SVM</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Weighted Voting</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">96</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Simple ensemble model with better performance.</td>
                        </tr>
                    </tbody>
                </table>
            </table-wrap>
        </sec>
        <sec id="sec7">
            <title>Proposed methodology</title>
            <p>A new Gradient-Based Weight Optimized Ensemble Model (GBWOEM), which uses a variety of base models to improve prediction performance, has been introduced. 
                <xref ref-type="fig" rid="f1">
Figure 1</xref> provides a full overview of the GBWOEM&#x2019;s design. A dataset is first obtained from the UCI repository, and then extensive Exploratory Data Analysis (EDA), pre-processing, data transformation, and normalization are performed to ensure that the data are ready for modelling. To enable extensive model evaluation and performance assessment, the dataset was divided into training, validation, and testing sets. We chose five diverse base models for the ensemble model, each representing a different modelling approach: Logistic Regression (LR) for statistical strength, Decision Tree Classifier (DTC) for interpretability, Random Forest Classifier (RFC) for robustness and ensemble capabilities, Multi-Layer Perceptron (MLP) for deep learning, and K-Nearest Neighbours (KNN) for distance-based methodology.</p>
            <fig fig-type="figure" id="f1" orientation="portrait" position="float">
                <label>
Figure 1. </label>
                <caption>
                    <title>Proposed methodology.</title>
                </caption>
                <graphic id="gr1" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/195371/744c354a-e679-40bb-80ed-d5612f6ac413_figure1.gif"/>
            </fig>
            <p>Grid Search is used to improve hyperparameters for each of these foundation models, and K-Fold Cross-Validation is used to guarantee generalization across various training data subsets. Five separately optimized models are the end product of this method. The GBWOEM iteratively selects combinations of base models (
                <inline-formula>

                    <mml:math display="inline">
                        <mml:msub>
                            <mml:msub>
                                <mml:mn>5</mml:mn>
                                <mml:mi>C</mml:mi>
                            </mml:msub>
                            <mml:mn>2</mml:mn>
                        </mml:msub>
                        <mml:mo>,</mml:mo>
                        <mml:msub>
                            <mml:msub>
                                <mml:mn>5</mml:mn>
                                <mml:mi>C</mml:mi>
                            </mml:msub>
                            <mml:mn>3</mml:mn>
                        </mml:msub>
                        <mml:mo>,</mml:mo>
                        <mml:msub>
                            <mml:msub>
                                <mml:mn>5</mml:mn>
                                <mml:mi>C</mml:mi>
                            </mml:msub>
                            <mml:mn>4</mml:mn>
                        </mml:msub>
                        <mml:mo>,</mml:mo>
                        <mml:mtext mathvariant="normal">and</mml:mtext>
                        <mml:mspace width="0.25em"/>
                        <mml:msub>
                            <mml:msub>
                                <mml:mn>5</mml:mn>
                                <mml:mi>C</mml:mi>
                            </mml:msub>
                            <mml:mn>5</mml:mn>
                        </mml:msub>
                    </mml:math>
</inline-formula>) or Weighted Average Models (WAM) using the five optimized models that are input. Using the validation dataset, the GBWOEM adjusts the weights of the chosen base models during each iteration to ascertain their respective contributions to the ensemble. The effectiveness of the ensemble is then determined by evaluating its performance on a test dataset. The combinatorial possibilities of choosing various subsets of the five base models yields 26 potential combinations because of the GBWOEM method. By assessing the performance of every combination on the test set, GBWOEM determines the ensemble configuration that enhances the accuracy of the predictions. With a combination of statistical, distance-based, tree-based, and neural network techniques, the final model is chosen based on best predictive performance out of all the basic models.</p>
            <sec id="sec8">
                <title>Datasets</title>
                <p>While developing a model, it is important to evaluate its performance on a variety of datasets. Different datasets represent different disease domains such as diabetes, cancer, thyroid, and obesity. Each dataset has distinct properties, including differences in feature types, noise level, and distribution. Testing the model&#x2019;s performance across these broad domains helps determine the model&#x2019;s ability to generalize new data. Using different datasets with diverse qualities and dimensions, evaluate the model&#x2019;s robustness and determine whether the model consistently performs well or is impacted by the nature of the data. It can identify areas where the model can be improved, such as by handling imbalanced data or dealing with noise. The analysis of performance inconsistencies can aid in model adjustment and fine-tuning. Information regarding the datasets used in this experiment is presented in 
                    <xref ref-type="table" rid="T2">
Table 2</xref>.</p>
                <table-wrap id="T2" orientation="portrait" position="float">
                    <label>
Table 2. </label>
                    <caption>
                        <title>Information of the dataset.</title>
                    </caption>
                    <table content-type="article-table" frame="hsides">
                        <thead>
                            <tr>
                                <th align="left" colspan="1" rowspan="1" valign="top">
Name of the datasets</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">
Number of instances</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">
Number of features</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">
Target variable</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">
Data distribution</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">
Missing value present?</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">
Feature type</th>
                            </tr>
                        </thead>
                        <tbody>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Breast Cancer Dataset 
(BC DS)
                                    <sup>
                                        <xref ref-type="bibr" rid="ref30">29</xref>
                                    </sup>
                                </td>
                                <td align="left" colspan="1" rowspan="1" valign="top">569</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">32</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Diagnosis
                                    <break/>Malignant/M = 1
                                    <break/>Benign/B = 0</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">1: 37.3%
                                    <break/>0: 62.7%</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">No</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Numerical</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Diabetic Retinopathy Debrecen 
(DRD DS)
                                    <sup>
                                        <xref ref-type="bibr" rid="ref31">30</xref>
                                    </sup>
                                </td>
                                <td align="left" colspan="1" rowspan="1" valign="top">1151</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">20</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Diabetic Retinopathy (1, 0)</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">1: 52.9%
                                    <break/>0: 47.1%</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">No</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Numerical</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Pima Indians Diabetes Database 
(PID DS)
                                    <sup>
                                        <xref ref-type="bibr" rid="ref32">31</xref>
                                    </sup>
                                </td>
                                <td align="left" colspan="1" rowspan="1" valign="top">768</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">9</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Outcome (1, 0)</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">1: 34.9%
                                    <break/>0: 65.1%</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Yes</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Numerical</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Obesity Dataset 
(OL DS)
                                    <sup>
                                        <xref ref-type="bibr" rid="ref33">32</xref>
                                    </sup>
                                </td>
                                <td align="left" colspan="1" rowspan="1" valign="top">2111</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">17</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Obesity Level
                                    <break/>Normal (0), Obesity (1)</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">1: 46.6%
                                    <break/>0: 53.4%</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">No</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Numerical, Categorical</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Thyroid Disease 
(TH DS)
                                    <sup>
                                        <xref ref-type="bibr" rid="ref34">33</xref>
                                    </sup>
                                </td>
                                <td align="left" colspan="1" rowspan="1" valign="top">3772</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">30</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Thyroid Disease (1, 0)</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">1: 91.8%
                                    <break/>0: 8.2%</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Yes</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Numerical, Categorical</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
            </sec>
            <sec id="sec9">
                <title>Base models</title>
                <p>An ensemble model in machine learning makes predictions by combining several &#x201c;base learners&#x201d; or &#x201c;base estimators&#x201d;, each of which performs a classification or prediction task. In our proposed work, to build the GBWOEM, Decision Tree Classifier (DTC), Logistic Regression (LR), Random Forest Classifier (RFC), K-Nearest Neighbour (KNN), and Multi-Layer Perceptron (MLP) is used.</p>
                <p>
LR is a widely used empirical model in clinical analyses. It serves multiple purposes, including classification and feature selection, and as a meta-learner in ensemble models.
                    <sup>
                        <xref ref-type="bibr" rid="ref35">34</xref>&#x2013;
                        <xref ref-type="bibr" rid="ref37">36</xref>
                    </sup> As a supervised ML algorithm, binary classification is the primary application of LR. It evaluates the relationship between one or more independent variables and categorizes data into distinct classes. Decision trees are used in complex decision-making processes or to predict patient outcomes based on features from large datasets.
                    <sup>
                        <xref ref-type="bibr" rid="ref38">37</xref>&#x2013;
                        <xref ref-type="bibr" rid="ref40">39</xref>
                    </sup> The trees divide data on the basis of feature values and provide optimal decisions with respect to certain criteria, for example, Gini impurity 
                    <inline-formula>

                        <mml:math display="inline">
                            <mml:mi>G</mml:mi>
                            <mml:mo>=</mml:mo>
                            <mml:mn>1</mml:mn>
                            <mml:mo>&#x2212;</mml:mo>
                            <mml:munderover>
                                <mml:mo>&#x2211;</mml:mo>
                                <mml:mrow>
                                    <mml:mi>i</mml:mi>
                                    <mml:mo>=</mml:mo>
                                    <mml:mn>1</mml:mn>
                                </mml:mrow>
                                <mml:mi>n</mml:mi>
                            </mml:munderover>
                            <mml:msubsup>
                                <mml:mi>p</mml:mi>
                                <mml:mi>i</mml:mi>
                                <mml:mn>2</mml:mn>
                            </mml:msubsup>
                        </mml:math>
</inline-formula> or information gain 
                    <inline-formula>

                        <mml:math display="inline">
                            <mml:mi>IG</mml:mi>
                            <mml:mo>=</mml:mo>
                            <mml:mi mathvariant="normal">H</mml:mi>
                            <mml:mrow>
                                <mml:mo stretchy="true">(</mml:mo>
                                <mml:mi mathvariant="normal">Y</mml:mi>
                                <mml:mo stretchy="true">)</mml:mo>
                            </mml:mrow>
                            <mml:mo>&#x2212;</mml:mo>
                            <mml:mi mathvariant="normal">H</mml:mi>
                            <mml:mrow>
                                <mml:mo stretchy="true">(</mml:mo>
                                <mml:mi mathvariant="normal">Y</mml:mi>
                                <mml:mo>|</mml:mo>
                                <mml:mi mathvariant="normal">X</mml:mi>
                                <mml:mo stretchy="true">)</mml:mo>
                            </mml:mrow>
                        </mml:math>
</inline-formula>, where H is entropy and p
                    <sub>i</sub> is the probability of class. A data point is assigned with a label of the majority class among its k nearest neighbours by the k-NN algorithm, where k is a user-specified hyperparameter. It matches these neighbours using distance metrics, such as the Euclidean distance 
                    <inline-formula>

                        <mml:math display="inline">
                            <mml:mi>d</mml:mi>
                            <mml:mo>=</mml:mo>
                            <mml:msqrt>
                                <mml:mrow>
                                    <mml:munderover>
                                        <mml:mo>&#x2211;</mml:mo>
                                        <mml:mrow>
                                            <mml:mi>i</mml:mi>
                                            <mml:mo>=</mml:mo>
                                            <mml:mn>1</mml:mn>
                                        </mml:mrow>
                                        <mml:mi>n</mml:mi>
                                    </mml:munderover>
                                    <mml:msup>
                                        <mml:mrow>
                                            <mml:mo stretchy="true">(</mml:mo>
                                            <mml:msub>
                                                <mml:mi>x</mml:mi>
                                                <mml:mi>i</mml:mi>
                                            </mml:msub>
                                            <mml:mo>&#x2212;</mml:mo>
                                            <mml:msub>
                                                <mml:mi>y</mml:mi>
                                                <mml:mi>i</mml:mi>
                                            </mml:msub>
                                            <mml:mo stretchy="true">)</mml:mo>
                                        </mml:mrow>
                                        <mml:mn>2</mml:mn>
                                    </mml:msup>
                                </mml:mrow>
                            </mml:msqrt>
                            <mml:mo>.</mml:mo>
                        </mml:math>
</inline-formula>
                    <sup>
                        <xref ref-type="bibr" rid="ref41">40</xref>
                    </sup> Methods such as bagging and boosting can be utilized with k-NN to develop more robust models that reduce noise sensitivity and improve the accuracy.
                    <sup>
                        <xref ref-type="bibr" rid="ref42">41</xref>
                    </sup> Random Forests combines multiple decision trees trained on bootstrap samples with a random subset of features,
                    <sup>
                        <xref ref-type="bibr" rid="ref43">42</xref>
                    </sup> significantly reducing overfitting.
                    <sup>
                        <xref ref-type="bibr" rid="ref44">43</xref>
                    </sup> Taking this into consideration in the field of healthcare, it can be utilized with tasks pertaining to disease classification, risk prediction, and patient outcome forecasting. MLPs are deep learning models capable of performing complicated classification and regression tasks because their ability is to represent complex non-linear relationships using multiple layers of neurons.
                    <sup>
                        <xref ref-type="bibr" rid="ref45">44</xref>
                    </sup> Using backpropagation and gradient descent, it minimizes a loss function and subsequently the network learns, where the loss function for classification tasks might be cross-entropy 
                    <inline-formula>

                        <mml:math display="inline">
                            <mml:mi>L</mml:mi>
                            <mml:mo>=</mml:mo>
                            <mml:mo>&#x2212;</mml:mo>
                            <mml:munderover>
                                <mml:mo>&#x2211;</mml:mo>
                                <mml:mrow>
                                    <mml:mi>i</mml:mi>
                                    <mml:mo>=</mml:mo>
                                    <mml:mn>1</mml:mn>
                                </mml:mrow>
                                <mml:mi>n</mml:mi>
                            </mml:munderover>
                            <mml:mspace width="0.25em"/>
                            <mml:msub>
                                <mml:mi>y</mml:mi>
                                <mml:mi>i</mml:mi>
                            </mml:msub>
                            <mml:mo>log</mml:mo>
                            <mml:mrow>
                                <mml:mo stretchy="true">(</mml:mo>
                                <mml:mover accent="true">
                                    <mml:msub>
                                        <mml:mi>y</mml:mi>
                                        <mml:mi>i</mml:mi>
                                    </mml:msub>
                                    <mml:mo stretchy="true">&#x0302;</mml:mo>
                                </mml:mover>
                                <mml:mo stretchy="true">)</mml:mo>
                            </mml:mrow>
                        </mml:math>
</inline-formula> and for regression tasks, it might be MSE. The activation functions used in the hidden layers, such as ReLU or sigmoid MLP, introduce non-linearity,
                    <sup>
                        <xref ref-type="bibr" rid="ref46">45</xref>
                    </sup> allowing them to pick up complex patterns in the data.</p>
                <p>LR, DT, kNN, RF, and MLP were considered for our ensemble model. While LR models can only capture linear relationships, DTs describe non-linear interactions and variable importance. Although RFs improve ensemble performance by combining many decision trees, they are designed to promote generalization over a wide range of datasets. MLPs can capture highly non-linear relationships in large datasets with relatively complex feature representations. The KNN learns the local structure and variance, leading to fine-grained predictions based on data closeness.</p>
            </sec>
            <sec id="sec10">
                <title>GBWOEM</title>
                <p>The Gradient-Based Weight Optimized Ensemble Model (GBWOEM) is a weighted average-based ensemble model that integrates five diverse base models: LR, DT, KNN, RF, and MLP. 
                    <xref ref-type="fig" rid="f2">
Figure 2</xref> shows a flowchart of the algorithm. The ensemble approach harnesses the strengths of each base model, and the final prediction is calculated by averaging the outputs with appropriate weights. GBWOEM assigns and updates weights to each base model in a systematic manner based on the performance of the base models. The entire process begins by training the base models. Every base model is trained rigorously using a grid search CV along with k-folds to extract the best model out of all variations. The model with the best accuracy among the trained models is selected as the initial candidate that will undergo optimization through the GBWOEM algorithm.</p>
                <fig fig-type="figure" id="f2" orientation="portrait" position="float">
                    <label>
Figure 2. </label>
                    <caption>
                        <title>Process flow of GBOWEM.</title>
                    </caption>
                    <graphic id="gr2" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/195371/744c354a-e679-40bb-80ed-d5612f6ac413_figure2.gif"/>
                </fig>
                <p>The first step in weight optimization is to establish the weights for every base model using two modes, GBWOEM-R, where the weights are randomly initialized and normalized to keep their sum equal to one. Alternatively, in GBWOEM-U, the weights are initialized uniformly. After the weight assignment, other hyper-parameters, including learning rate, number of iterations, and a patience parameter to stop early, are initialized. Subsequently, with these initial weights, the ensemble provides its first predictions based on the initial results and evaluates the ensemble using a loss function, which includes both training and validation losses. When the model fails to meet an early stopping condition, that is, if the validation loss does not improve within a certain number of iterations, the training is terminated so that overfitting can be avoided. However, if the stopping condition is not satisfied, the next phase involves calculating the gradient of the loss function with respect to the weights of the base models. Subsequently, the weights are updated using a gradient descent optimization technique to reduce the overall ensemble loss. This process is continued until the maximum number of iterations is reached, or the early stopping condition is met. The process is described in 
                    <xref ref-type="boxed-text" rid="B1">Algorithm 1</xref>.</p>
                <boxed-text id="B1" orientation="portrait" position="float">
                    <label>Algorithm 1. </label>
                    <caption>
                        <title>Gradient Based Weight Optimized Ensemble Model (GBWOEM).</title>
                    </caption>
                    <p>

                        <table-wrap id="T3" orientation="portrait" position="anchor">
                            <table content-type="article-table" frame="hsides">
                                <tbody>
                                    <tr>
                                        <td align="left" colspan="1" rowspan="1" valign="top">
                                            <bold>Input:</bold>
</td>
                                        <td align="left" colspan="1" rowspan="1" valign="top">
                                            <p>

                                                <list list-type="bullet">
                                                    <list-item>
                                                        <label>-</label>
                                                        <p>Learning rate (
                                                            <italic toggle="yes">&#x03b1;</italic>)</p>
                                                    </list-item>
                                                    <list-item>
                                                        <label>-</label>
                                                        <p>Number of iterations (
                                                            <italic toggle="yes">num iterations</italic>)</p>
                                                    </list-item>
                                                    <list-item>
                                                        <label>-</label>
                                                        <p>Patience for early stopping (
                                                            <italic toggle="yes">patience</italic>)</p>
                                                    </list-item>
                                                    <list-item>
                                                        <label>-</label>
                                                        <p>Weight initializer method (
                                                            <italic toggle="yes">weight initializer</italic>)</p>
                                                    </list-item>
                                                </list>
                                            </p>
</td>
                                    </tr>
                                    <tr>
                                        <td align="left" colspan="1" rowspan="1" valign="top">
                                            <bold>Output:</bold>
</td>
                                        <td align="left" colspan="1" rowspan="1" valign="top">
                                            <p>

                                                <list list-type="bullet">
                                                    <list-item>
                                                        <label>-</label>
                                                        <p>Trained ensemble model with optimized weights</p>
                                                    </list-item>
                                                </list>
                                            </p>
</td>
                                    </tr>
                                    <tr>
                                        <td align="left" colspan="1" rowspan="1" valign="top">
                                            <bold>Parameters:</bold>
</td>
                                        <td align="left" colspan="1" rowspan="1" valign="top">
                                            <p>

                                                <list list-type="bullet">
                                                    <list-item>
                                                        <label>-</label>
                                                        <p>Number of base models: n</p>
                                                    </list-item>
                                                    <list-item>
                                                        <label>-</label>
                                                        <p>Base models: 
                                                            <inline-formula>

                                                                <mml:math display="inline">
                                                                    <mml:mrow>
                                                                        <mml:mo stretchy="true">{</mml:mo>
                                                                        <mml:msub>
                                                                            <mml:mi>M</mml:mi>
                                                                            <mml:mn>1</mml:mn>
                                                                        </mml:msub>
                                                                        <mml:mo>,</mml:mo>
                                                                        <mml:msub>
                                                                            <mml:mi>M</mml:mi>
                                                                            <mml:mn>2</mml:mn>
                                                                        </mml:msub>
                                                                        <mml:mo>,</mml:mo>
                                                                        <mml:mo>&#x2026;</mml:mo>
                                                                        <mml:mo>,</mml:mo>
                                                                        <mml:msub>
                                                                            <mml:mi>M</mml:mi>
                                                                            <mml:mi>n</mml:mi>
                                                                        </mml:msub>
                                                                        <mml:mo stretchy="true">}</mml:mo>
                                                                    </mml:mrow>
                                                                </mml:math>
</inline-formula>
                                                        </p>
                                                    </list-item>
                                                    <list-item>
                                                        <label>-</label>
                                                        <p>Ensemble predictions on training set: 
                                                            <inline-formula>

                                                                <mml:math display="inline">
                                                                    <mml:mrow>
                                                                        <mml:mo stretchy="true">{</mml:mo>
                                                                        <mml:msubsup>
                                                                            <mml:mover accent="true">
                                                                                <mml:mi>Y</mml:mi>
                                                                                <mml:mo stretchy="true">&#x0302;</mml:mo>
                                                                            </mml:mover>
                                                                            <mml:mtext mathvariant="italic">train</mml:mtext>
                                                                            <mml:mrow>
                                                                                <mml:mo stretchy="true">(</mml:mo>
                                                                                <mml:mn>1</mml:mn>
                                                                                <mml:mo stretchy="true">)</mml:mo>
                                                                            </mml:mrow>
                                                                        </mml:msubsup>
                                                                        <mml:mo>,</mml:mo>
                                                                        <mml:msubsup>
                                                                            <mml:mover accent="true">
                                                                                <mml:mi>Y</mml:mi>
                                                                                <mml:mo stretchy="true">&#x0302;</mml:mo>
                                                                            </mml:mover>
                                                                            <mml:mtext mathvariant="italic">train</mml:mtext>
                                                                            <mml:mrow>
                                                                                <mml:mo stretchy="true">(</mml:mo>
                                                                                <mml:mn>2</mml:mn>
                                                                                <mml:mo stretchy="true">)</mml:mo>
                                                                            </mml:mrow>
                                                                        </mml:msubsup>
                                                                        <mml:mo>,</mml:mo>
                                                                        <mml:mo>&#x2026;</mml:mo>
                                                                        <mml:mo>,</mml:mo>
                                                                        <mml:msubsup>
                                                                            <mml:mover accent="true">
                                                                                <mml:mi>Y</mml:mi>
                                                                                <mml:mo stretchy="true">&#x0302;</mml:mo>
                                                                            </mml:mover>
                                                                            <mml:mtext mathvariant="italic">train</mml:mtext>
                                                                            <mml:mrow>
                                                                                <mml:mo stretchy="true">(</mml:mo>
                                                                                <mml:mi>n</mml:mi>
                                                                                <mml:mo stretchy="true">)</mml:mo>
                                                                            </mml:mrow>
                                                                        </mml:msubsup>
                                                                        <mml:mo stretchy="true">}</mml:mo>
                                                                    </mml:mrow>
                                                                </mml:math>
</inline-formula>
                                                        </p>
                                                    </list-item>
                                                    <list-item>
                                                        <label>-</label>
                                                        <p>Ensemble predictions on validation set: 
                                                            <inline-formula>

                                                                <mml:math display="inline">
                                                                    <mml:mrow>
                                                                        <mml:mo stretchy="true">{</mml:mo>
                                                                        <mml:msubsup>
                                                                            <mml:mover accent="true">
                                                                                <mml:mi>Y</mml:mi>
                                                                                <mml:mo stretchy="true">&#x0302;</mml:mo>
                                                                            </mml:mover>
                                                                            <mml:mi mathvariant="italic">val</mml:mi>
                                                                            <mml:mrow>
                                                                                <mml:mo stretchy="true">(</mml:mo>
                                                                                <mml:mn>1</mml:mn>
                                                                                <mml:mo stretchy="true">)</mml:mo>
                                                                            </mml:mrow>
                                                                        </mml:msubsup>
                                                                        <mml:mo>,</mml:mo>
                                                                        <mml:msubsup>
                                                                            <mml:mover accent="true">
                                                                                <mml:mi>Y</mml:mi>
                                                                                <mml:mo stretchy="true">&#x0302;</mml:mo>
                                                                            </mml:mover>
                                                                            <mml:mi mathvariant="italic">val</mml:mi>
                                                                            <mml:mrow>
                                                                                <mml:mo stretchy="true">(</mml:mo>
                                                                                <mml:mn>2</mml:mn>
                                                                                <mml:mo stretchy="true">)</mml:mo>
                                                                            </mml:mrow>
                                                                        </mml:msubsup>
                                                                        <mml:mo>,</mml:mo>
                                                                        <mml:mo>&#x2026;</mml:mo>
                                                                        <mml:mo>,</mml:mo>
                                                                        <mml:msubsup>
                                                                            <mml:mover accent="true">
                                                                                <mml:mi>Y</mml:mi>
                                                                                <mml:mo stretchy="true">&#x0302;</mml:mo>
                                                                            </mml:mover>
                                                                            <mml:mi mathvariant="italic">val</mml:mi>
                                                                            <mml:mrow>
                                                                                <mml:mo stretchy="true">(</mml:mo>
                                                                                <mml:mi>n</mml:mi>
                                                                                <mml:mo stretchy="true">)</mml:mo>
                                                                            </mml:mrow>
                                                                        </mml:msubsup>
                                                                        <mml:mo stretchy="true">}</mml:mo>
                                                                    </mml:mrow>
                                                                </mml:math>
</inline-formula>
                                                        </p>
                                                    </list-item>
                                                    <list-item>
                                                        <label>-</label>
                                                        <p>Ensemble predictions on test set: 
                                                            <inline-formula>

                                                                <mml:math display="inline">
                                                                    <mml:mrow>
                                                                        <mml:mo stretchy="true">{</mml:mo>
                                                                        <mml:msubsup>
                                                                            <mml:mover accent="true">
                                                                                <mml:mi>Y</mml:mi>
                                                                                <mml:mo stretchy="true">&#x0302;</mml:mo>
                                                                            </mml:mover>
                                                                            <mml:mtext mathvariant="italic">test</mml:mtext>
                                                                            <mml:mrow>
                                                                                <mml:mo stretchy="true">(</mml:mo>
                                                                                <mml:mn>1</mml:mn>
                                                                                <mml:mo stretchy="true">)</mml:mo>
                                                                            </mml:mrow>
                                                                        </mml:msubsup>
                                                                        <mml:mo>,</mml:mo>
                                                                        <mml:msubsup>
                                                                            <mml:mover accent="true">
                                                                                <mml:mi>Y</mml:mi>
                                                                                <mml:mo stretchy="true">&#x0302;</mml:mo>
                                                                            </mml:mover>
                                                                            <mml:mtext mathvariant="italic">test</mml:mtext>
                                                                            <mml:mrow>
                                                                                <mml:mo stretchy="true">(</mml:mo>
                                                                                <mml:mn>2</mml:mn>
                                                                                <mml:mo stretchy="true">)</mml:mo>
                                                                            </mml:mrow>
                                                                        </mml:msubsup>
                                                                        <mml:mo>,</mml:mo>
                                                                        <mml:mo>&#x2026;</mml:mo>
                                                                        <mml:mo>,</mml:mo>
                                                                        <mml:msubsup>
                                                                            <mml:mover accent="true">
                                                                                <mml:mi>Y</mml:mi>
                                                                                <mml:mo stretchy="true">&#x0302;</mml:mo>
                                                                            </mml:mover>
                                                                            <mml:mtext mathvariant="italic">test</mml:mtext>
                                                                            <mml:mrow>
                                                                                <mml:mo stretchy="true">(</mml:mo>
                                                                                <mml:mi>n</mml:mi>
                                                                                <mml:mo stretchy="true">)</mml:mo>
                                                                            </mml:mrow>
                                                                        </mml:msubsup>
                                                                        <mml:mo stretchy="true">}</mml:mo>
                                                                    </mml:mrow>
                                                                </mml:math>
</inline-formula>
                                                        </p>
                                                    </list-item>
                                                    <list-item>
                                                        <label>-</label>
                                                        <p>Weights: 
                                                            <inline-formula>

                                                                <mml:math display="inline">
                                                                    <mml:mi>W</mml:mi>
                                                                    <mml:mrow>
                                                                        <mml:mo stretchy="true">{</mml:mo>
                                                                        <mml:msub>
                                                                            <mml:mi>w</mml:mi>
                                                                            <mml:mn>1</mml:mn>
                                                                        </mml:msub>
                                                                        <mml:mo>,</mml:mo>
                                                                        <mml:msub>
                                                                            <mml:mi>w</mml:mi>
                                                                            <mml:mn>2</mml:mn>
                                                                        </mml:msub>
                                                                        <mml:mo>,</mml:mo>
                                                                        <mml:mo>&#x2026;</mml:mo>
                                                                        <mml:mo>,</mml:mo>
                                                                        <mml:msub>
                                                                            <mml:mi>w</mml:mi>
                                                                            <mml:mi>n</mml:mi>
                                                                        </mml:msub>
                                                                        <mml:mo stretchy="true">}</mml:mo>
                                                                    </mml:mrow>
                                                                </mml:math>
</inline-formula>
                                                        </p>
                                                    </list-item>
                                                </list>
                                            </p>
</td>
                                    </tr>
                                    <tr>
                                        <td align="left" colspan="2" rowspan="1" valign="top">1.&#x2003;If weight_initializer == &#x2018;random&#x2019;:
                                            <break/>2.&#x2003;&#x2003;W = [n random number sampled uniformly from [0,1)]
                                            <break/>3.&#x2003;&#x2003;
                                            <inline-formula>

                                                <mml:math display="inline">
                                                    <mml:msub>
                                                        <mml:mi>W</mml:mi>
                                                        <mml:mtext mathvariant="italic">normalized</mml:mtext>
                                                    </mml:msub>
                                                </mml:math>
</inline-formula> = 
                                            <inline-formula>

                                                <mml:math display="inline">
                                                    <mml:mfrac>
                                                        <mml:mi>W</mml:mi>
                                                        <mml:mrow>
                                                            <mml:mo>&#x2211;</mml:mo>
                                                            <mml:mi>W</mml:mi>
                                                        </mml:mrow>
                                                    </mml:mfrac>
                                                </mml:math>
</inline-formula>

                                            <break/>4.&#x2003;&#x2003;W = 
                                            <inline-formula>

                                                <mml:math display="inline">
                                                    <mml:msub>
                                                        <mml:mi>W</mml:mi>
                                                        <mml:mtext mathvariant="italic">normalized</mml:mtext>
                                                    </mml:msub>
                                                </mml:math>
</inline-formula>

                                            <break/>5.&#x2003;Else If weight_initializer == &#x2018;uniform&#x2019;:
                                            <break/>6.&#x2003;&#x2003;W = ones_array/n
                                            <break/>7.&#x2003;Else:
                                            <break/>8.&#x2003;&#x2003;Value Error
                                            <break/>9.&#x2003;For each base model 
                                            <inline-formula>

                                                <mml:math display="inline">
                                                    <mml:msub>
                                                        <mml:mi>M</mml:mi>
                                                        <mml:mi>i</mml:mi>
                                                    </mml:msub>
                                                    <mml:mo>:</mml:mo>
                                                </mml:math>
</inline-formula>

                                            <break/>10.&#x2003;&#x2003;Fit 
                                            <inline-formula>

                                                <mml:math display="inline">
                                                    <mml:msub>
                                                        <mml:mi>M</mml:mi>
                                                        <mml:mi>i</mml:mi>
                                                    </mml:msub>
                                                </mml:math>
</inline-formula> on training data (
                                            <inline-formula>

                                                <mml:math display="inline">
                                                    <mml:msub>
                                                        <mml:mi>X</mml:mi>
                                                        <mml:mtext mathvariant="italic">train</mml:mtext>
                                                    </mml:msub>
                                                    <mml:mo>,</mml:mo>
                                                    <mml:msub>
                                                        <mml:mi>Y</mml:mi>
                                                        <mml:mtext mathvariant="italic">train</mml:mtext>
                                                    </mml:msub>
                                                </mml:math>
</inline-formula>)
                                            <break/>11.&#x2003;&#x2003;Predict probabilities for 
                                            <inline-formula>

                                                <mml:math display="inline">
                                                    <mml:msub>
                                                        <mml:mi>X</mml:mi>
                                                        <mml:mtext mathvariant="italic">train</mml:mtext>
                                                    </mml:msub>
                                                    <mml:mo>,</mml:mo>
                                                    <mml:msub>
                                                        <mml:mi>X</mml:mi>
                                                        <mml:mi mathvariant="italic">val</mml:mi>
                                                    </mml:msub>
                                                    <mml:mo>,</mml:mo>
                                                    <mml:msub>
                                                        <mml:mi>X</mml:mi>
                                                        <mml:mtext mathvariant="italic">test</mml:mtext>
                                                    </mml:msub>
                                                </mml:math>
</inline-formula>

                                            <break/>12.&#x2003;&#x2003;Store Predictions 
                                            <inline-formula>

                                                <mml:math display="inline">
                                                    <mml:msubsup>
                                                        <mml:mover accent="true">
                                                            <mml:mi>Y</mml:mi>
                                                            <mml:mo stretchy="true">&#x0302;</mml:mo>
                                                        </mml:mover>
                                                        <mml:mtext mathvariant="italic">train</mml:mtext>
                                                        <mml:mrow>
                                                            <mml:mo stretchy="true">(</mml:mo>
                                                            <mml:mn>1</mml:mn>
                                                            <mml:mo stretchy="true">)</mml:mo>
                                                        </mml:mrow>
                                                    </mml:msubsup>
                                                    <mml:mo>,</mml:mo>
                                                    <mml:msubsup>
                                                        <mml:mover accent="true">
                                                            <mml:mi>Y</mml:mi>
                                                            <mml:mo stretchy="true">&#x0302;</mml:mo>
                                                        </mml:mover>
                                                        <mml:mtext mathvariant="italic">train</mml:mtext>
                                                        <mml:mrow>
                                                            <mml:mo stretchy="true">(</mml:mo>
                                                            <mml:mn>2</mml:mn>
                                                            <mml:mo stretchy="true">)</mml:mo>
                                                        </mml:mrow>
                                                    </mml:msubsup>
                                                    <mml:mo>,</mml:mo>
                                                    <mml:mo>&#x2026;</mml:mo>
                                                    <mml:mo>,</mml:mo>
                                                    <mml:msubsup>
                                                        <mml:mover accent="true">
                                                            <mml:mi>Y</mml:mi>
                                                            <mml:mo stretchy="true">&#x0302;</mml:mo>
                                                        </mml:mover>
                                                        <mml:mtext mathvariant="italic">train</mml:mtext>
                                                        <mml:mrow>
                                                            <mml:mo stretchy="true">(</mml:mo>
                                                            <mml:mi>n</mml:mi>
                                                            <mml:mo stretchy="true">)</mml:mo>
                                                        </mml:mrow>
                                                    </mml:msubsup>
                                                </mml:math>
</inline-formula>

                                            <break/>13.&#x2003;For iteration t in range (num_iterations):
                                            <break/>14.&#x2003;&#x2003;Compute ensemble predictions using current weights:
                                            <break/>15.&#x2003;&#x2003;&#x2003;
                                            <inline-formula>

                                                <mml:math display="inline">
                                                    <mml:msubsup>
                                                        <mml:mover accent="true">
                                                            <mml:mi>Y</mml:mi>
                                                            <mml:mo stretchy="true">&#x0302;</mml:mo>
                                                        </mml:mover>
                                                        <mml:mrow>
                                                            <mml:mtext mathvariant="italic">ensemble</mml:mtext>
                                                            <mml:mo>,</mml:mo>
                                                            <mml:mtext mathvariant="italic">train</mml:mtext>
                                                        </mml:mrow>
                                                        <mml:mrow>
                                                            <mml:mo stretchy="true">(</mml:mo>
                                                            <mml:mi>t</mml:mi>
                                                            <mml:mo stretchy="true">)</mml:mo>
                                                        </mml:mrow>
                                                    </mml:msubsup>
                                                    <mml:mo>=</mml:mo>
                                                    <mml:munderover>
                                                        <mml:mo>&#x2211;</mml:mo>
                                                        <mml:mrow>
                                                            <mml:mi>i</mml:mi>
                                                            <mml:mo>=</mml:mo>
                                                            <mml:mn>1</mml:mn>
                                                        </mml:mrow>
                                                        <mml:mi>n</mml:mi>
                                                    </mml:munderover>
                                                    <mml:msubsup>
                                                        <mml:mi>w</mml:mi>
                                                        <mml:mi>i</mml:mi>
                                                        <mml:mrow>
                                                            <mml:mo stretchy="true">(</mml:mo>
                                                            <mml:mi>t</mml:mi>
                                                            <mml:mo stretchy="true">)</mml:mo>
                                                        </mml:mrow>
                                                    </mml:msubsup>
                                                    <mml:mo>.</mml:mo>
                                                    <mml:msubsup>
                                                        <mml:mover accent="true">
                                                            <mml:mi>Y</mml:mi>
                                                            <mml:mo stretchy="true">&#x0302;</mml:mo>
                                                        </mml:mover>
                                                        <mml:mtext mathvariant="italic">train</mml:mtext>
                                                        <mml:mrow>
                                                            <mml:mo stretchy="true">(</mml:mo>
                                                            <mml:mi>i</mml:mi>
                                                            <mml:mo stretchy="true">)</mml:mo>
                                                        </mml:mrow>
                                                    </mml:msubsup>
                                                    <mml:mspace width="0.25em"/>
                                                </mml:math>
</inline-formula>

                                            <break/>16.&#x2003;&#x2003;&#x2003;
                                            <inline-formula>

                                                <mml:math display="inline">
                                                    <mml:msubsup>
                                                        <mml:mover accent="true">
                                                            <mml:mi>Y</mml:mi>
                                                            <mml:mo stretchy="true">&#x0302;</mml:mo>
                                                        </mml:mover>
                                                        <mml:mrow>
                                                            <mml:mtext mathvariant="italic">ensemble</mml:mtext>
                                                            <mml:mo>,</mml:mo>
                                                            <mml:mi mathvariant="italic">val</mml:mi>
                                                        </mml:mrow>
                                                        <mml:mrow>
                                                            <mml:mo stretchy="true">(</mml:mo>
                                                            <mml:mi>t</mml:mi>
                                                            <mml:mo stretchy="true">)</mml:mo>
                                                        </mml:mrow>
                                                    </mml:msubsup>
                                                    <mml:mo>=</mml:mo>
                                                    <mml:munderover>
                                                        <mml:mo>&#x2211;</mml:mo>
                                                        <mml:mrow>
                                                            <mml:mi>i</mml:mi>
                                                            <mml:mo>=</mml:mo>
                                                            <mml:mn>1</mml:mn>
                                                        </mml:mrow>
                                                        <mml:mi>n</mml:mi>
                                                    </mml:munderover>
                                                    <mml:msubsup>
                                                        <mml:mi>w</mml:mi>
                                                        <mml:mi>i</mml:mi>
                                                        <mml:mrow>
                                                            <mml:mo stretchy="true">(</mml:mo>
                                                            <mml:mi>t</mml:mi>
                                                            <mml:mo stretchy="true">)</mml:mo>
                                                        </mml:mrow>
                                                    </mml:msubsup>
                                                    <mml:mo>.</mml:mo>
                                                    <mml:msubsup>
                                                        <mml:mover accent="true">
                                                            <mml:mi>Y</mml:mi>
                                                            <mml:mo stretchy="true">&#x0302;</mml:mo>
                                                        </mml:mover>
                                                        <mml:mi mathvariant="italic">val</mml:mi>
                                                        <mml:mrow>
                                                            <mml:mo stretchy="true">(</mml:mo>
                                                            <mml:mi>i</mml:mi>
                                                            <mml:mo stretchy="true">)</mml:mo>
                                                        </mml:mrow>
                                                    </mml:msubsup>
                                                    <mml:mspace width="0.25em"/>
                                                </mml:math>
</inline-formula>

                                            <break/>17.&#x2003;&#x2003;&#x2003;
                                            <inline-formula>

                                                <mml:math display="inline">
                                                    <mml:msubsup>
                                                        <mml:mover accent="true">
                                                            <mml:mi>Y</mml:mi>
                                                            <mml:mo stretchy="true">&#x0302;</mml:mo>
                                                        </mml:mover>
                                                        <mml:mrow>
                                                            <mml:mtext mathvariant="italic">ensemble</mml:mtext>
                                                            <mml:mo>,</mml:mo>
                                                            <mml:mtext mathvariant="italic">train</mml:mtext>
                                                        </mml:mrow>
                                                        <mml:mrow>
                                                            <mml:mo stretchy="true">(</mml:mo>
                                                            <mml:mi>t</mml:mi>
                                                            <mml:mo stretchy="true">)</mml:mo>
                                                        </mml:mrow>
                                                    </mml:msubsup>
                                                    <mml:mo>=</mml:mo>
                                                    <mml:munderover>
                                                        <mml:mo>&#x2211;</mml:mo>
                                                        <mml:mrow>
                                                            <mml:mi>i</mml:mi>
                                                            <mml:mo>=</mml:mo>
                                                            <mml:mn>1</mml:mn>
                                                        </mml:mrow>
                                                        <mml:mi>n</mml:mi>
                                                    </mml:munderover>
                                                    <mml:msubsup>
                                                        <mml:mi>w</mml:mi>
                                                        <mml:mi>i</mml:mi>
                                                        <mml:mrow>
                                                            <mml:mo stretchy="true">(</mml:mo>
                                                            <mml:mi>t</mml:mi>
                                                            <mml:mo stretchy="true">)</mml:mo>
                                                        </mml:mrow>
                                                    </mml:msubsup>
                                                    <mml:mo>.</mml:mo>
                                                    <mml:msubsup>
                                                        <mml:mover accent="true">
                                                            <mml:mi>Y</mml:mi>
                                                            <mml:mo stretchy="true">&#x0302;</mml:mo>
                                                        </mml:mover>
                                                        <mml:mtext mathvariant="italic">test</mml:mtext>
                                                        <mml:mrow>
                                                            <mml:mo stretchy="true">(</mml:mo>
                                                            <mml:mi>i</mml:mi>
                                                            <mml:mo stretchy="true">)</mml:mo>
                                                        </mml:mrow>
                                                    </mml:msubsup>
                                                    <mml:mspace width="0.25em"/>
                                                </mml:math>
</inline-formula>

                                            <break/>18.&#x2003;&#x2003;Computing training and validation loss:
                                            <break/>19.&#x2003;&#x2003;&#x2003;
                                            <inline-formula>

                                                <mml:math display="inline">
                                                    <mml:msubsup>
                                                        <mml:mtext mathvariant="italic">loss</mml:mtext>
                                                        <mml:mtext mathvariant="italic">train</mml:mtext>
                                                        <mml:mrow>
                                                            <mml:mo stretchy="true">(</mml:mo>
                                                            <mml:mi>t</mml:mi>
                                                            <mml:mo stretchy="true">)</mml:mo>
                                                        </mml:mrow>
                                                    </mml:msubsup>
                                                    <mml:mo>=</mml:mo>
                                                    <mml:mtext mathvariant="italic">Loss</mml:mtext>
                                                    <mml:mo>_</mml:mo>
                                                    <mml:mtext mathvariant="italic">Function</mml:mtext>
                                                    <mml:mrow>
                                                        <mml:mo stretchy="true">(</mml:mo>
                                                        <mml:msub>
                                                            <mml:mi>y</mml:mi>
                                                            <mml:mtext mathvariant="italic">train</mml:mtext>
                                                        </mml:msub>
                                                        <mml:mo>,</mml:mo>
                                                        <mml:msubsup>
                                                            <mml:mover accent="true">
                                                                <mml:mi>Y</mml:mi>
                                                                <mml:mo stretchy="true">&#x0302;</mml:mo>
                                                            </mml:mover>
                                                            <mml:mrow>
                                                                <mml:mtext mathvariant="italic">ensemble</mml:mtext>
                                                                <mml:mo>,</mml:mo>
                                                                <mml:mtext mathvariant="italic">train</mml:mtext>
                                                            </mml:mrow>
                                                            <mml:mrow>
                                                                <mml:mo stretchy="true">(</mml:mo>
                                                                <mml:mi>t</mml:mi>
                                                                <mml:mo stretchy="true">)</mml:mo>
                                                            </mml:mrow>
                                                        </mml:msubsup>
                                                        <mml:mo stretchy="true">)</mml:mo>
                                                    </mml:mrow>
                                                </mml:math>
</inline-formula>

                                            <break/>20.&#x2003;&#x2003;&#x2003;
                                            <inline-formula>

                                                <mml:math display="inline">
                                                    <mml:msubsup>
                                                        <mml:mtext mathvariant="italic">loss</mml:mtext>
                                                        <mml:mi mathvariant="italic">val</mml:mi>
                                                        <mml:mrow>
                                                            <mml:mo stretchy="true">(</mml:mo>
                                                            <mml:mi>t</mml:mi>
                                                            <mml:mo stretchy="true">)</mml:mo>
                                                        </mml:mrow>
                                                    </mml:msubsup>
                                                    <mml:mo>=</mml:mo>
                                                    <mml:mtext mathvariant="italic">Loss</mml:mtext>
                                                    <mml:mo>_</mml:mo>
                                                    <mml:mtext mathvariant="italic">Function</mml:mtext>
                                                    <mml:mrow>
                                                        <mml:mo stretchy="true">(</mml:mo>
                                                        <mml:msub>
                                                            <mml:mi>y</mml:mi>
                                                            <mml:mi mathvariant="italic">val</mml:mi>
                                                        </mml:msub>
                                                        <mml:mo>,</mml:mo>
                                                        <mml:msubsup>
                                                            <mml:mover accent="true">
                                                                <mml:mi>Y</mml:mi>
                                                                <mml:mo stretchy="true">&#x0302;</mml:mo>
                                                            </mml:mover>
                                                            <mml:mrow>
                                                                <mml:mtext mathvariant="italic">ensemble</mml:mtext>
                                                                <mml:mo>,</mml:mo>
                                                                <mml:mi mathvariant="italic">val</mml:mi>
                                                            </mml:mrow>
                                                            <mml:mrow>
                                                                <mml:mo stretchy="true">(</mml:mo>
                                                                <mml:mi>t</mml:mi>
                                                                <mml:mo stretchy="true">)</mml:mo>
                                                            </mml:mrow>
                                                        </mml:msubsup>
                                                        <mml:mo stretchy="true">)</mml:mo>
                                                    </mml:mrow>
                                                </mml:math>
</inline-formula>

                                            <break/>21.&#x2003;Early Stopping:
                                            <break/>22.&#x2003;&#x2003;If 
                                            <inline-formula>

                                                <mml:math display="inline">
                                                    <mml:msubsup>
                                                        <mml:mtext mathvariant="italic">loss</mml:mtext>
                                                        <mml:mi mathvariant="italic">val</mml:mi>
                                                        <mml:mrow>
                                                            <mml:mo stretchy="true">(</mml:mo>
                                                            <mml:mi>t</mml:mi>
                                                            <mml:mo stretchy="true">)</mml:mo>
                                                        </mml:mrow>
                                                    </mml:msubsup>
                                                    <mml:mo>&lt;</mml:mo>
                                                    <mml:mi mathvariant="italic">bes</mml:mi>
                                                    <mml:msub>
                                                        <mml:mi>t</mml:mi>
                                                        <mml:mtext mathvariant="italic">loss</mml:mtext>
                                                    </mml:msub>
                                                </mml:math>
</inline-formula>:
                                            <break/>23.&#x2003;&#x2003;&#x2003;best_loss = 
                                            <inline-formula>

                                                <mml:math display="inline">
                                                    <mml:msubsup>
                                                        <mml:mtext mathvariant="italic">loss</mml:mtext>
                                                        <mml:mi mathvariant="italic">val</mml:mi>
                                                        <mml:mrow>
                                                            <mml:mo stretchy="true">(</mml:mo>
                                                            <mml:mi>t</mml:mi>
                                                            <mml:mo stretchy="true">)</mml:mo>
                                                        </mml:mrow>
                                                    </mml:msubsup>
                                                    <mml:mo>,</mml:mo>
                                                </mml:math>
</inline-formula>best_weights = current_weight, Count = 0
                                            <break/>24.&#x2003;Else:
                                            <break/>25.&#x2003;&#x2003;count = count + 1
                                            <break/>26.&#x2003;If count &gt;= patience: Break
                                            <break/>27.&#x2003;Compute gradient of loss w.r.t. weights:
                                            <break/>28.&#x2003;&#x2003;
                                            <inline-formula>

                                                <mml:math display="inline">
                                                    <mml:mo>&#x2207;</mml:mo>
                                                    <mml:mi mathvariant="normal">L</mml:mi>
                                                    <mml:mo>=</mml:mo>
                                                    <mml:mfrac>
                                                        <mml:mn>1</mml:mn>
                                                        <mml:mi>N</mml:mi>
                                                    </mml:mfrac>
                                                    <mml:mo>.</mml:mo>
                                                    <mml:mrow>
                                                        <mml:mo stretchy="true">(</mml:mo>
                                                        <mml:msubsup>
                                                            <mml:mover accent="true">
                                                                <mml:mi>Y</mml:mi>
                                                                <mml:mo stretchy="true">&#x0302;</mml:mo>
                                                            </mml:mover>
                                                            <mml:mrow>
                                                                <mml:mtext mathvariant="italic">ensemble</mml:mtext>
                                                                <mml:mo>,</mml:mo>
                                                                <mml:mtext mathvariant="italic">train</mml:mtext>
                                                            </mml:mrow>
                                                            <mml:mrow>
                                                                <mml:mo stretchy="true">(</mml:mo>
                                                                <mml:mi>t</mml:mi>
                                                                <mml:mo stretchy="true">)</mml:mo>
                                                            </mml:mrow>
                                                        </mml:msubsup>
                                                        <mml:mo>&#x2212;</mml:mo>
                                                        <mml:msub>
                                                            <mml:mi>y</mml:mi>
                                                            <mml:mtext mathvariant="italic">train</mml:mtext>
                                                        </mml:msub>
                                                        <mml:mo stretchy="true">)</mml:mo>
                                                    </mml:mrow>
                                                    <mml:mo>.</mml:mo>
                                                    <mml:msup>
                                                        <mml:msubsup>
                                                            <mml:mover accent="true">
                                                                <mml:mi>Y</mml:mi>
                                                                <mml:mo stretchy="true">&#x0302;</mml:mo>
                                                            </mml:mover>
                                                            <mml:mtext mathvariant="italic">train</mml:mtext>
                                                            <mml:mrow>
                                                                <mml:mo stretchy="true">(</mml:mo>
                                                                <mml:mi>t</mml:mi>
                                                                <mml:mo stretchy="true">)</mml:mo>
                                                            </mml:mrow>
                                                        </mml:msubsup>
                                                        <mml:mi>T</mml:mi>
                                                    </mml:msup>
                                                </mml:math>
</inline-formula>

                                            <break/>29.&#x2003;Update weighs using gradient descent:
                                            <break/>30.&#x2003;&#x2003;current_weights = current_weights - 
                                            <inline-formula>

                                                <mml:math display="inline">
                                                    <mml:mi>&#x03b1;</mml:mi>
                                                    <mml:mo>.</mml:mo>
                                                    <mml:mo>&#x2207;</mml:mo>
                                                    <mml:mi mathvariant="normal">L</mml:mi>
                                                </mml:math>
</inline-formula>
</td>
                                    </tr>
                                </tbody>
                            </table>
                        </table-wrap>
                    </p>
                </boxed-text>
                <p>Gradient descent is the key component of our proposed algorithm, which optimizes the ensemble model by minimizing the custom loss function. By penalizing inaccurate predictions more severely, particularly when the model is overconfident, the binary-cross-entropy-based loss function (
                    <xref ref-type="disp-formula" rid="e1">
Equation 1</xref>) ensures that the model can handle classification tasks effectively.
                    <disp-formula id="e1">

                        <mml:math display="block">
                            <mml:msub>
                                <mml:mtext mathvariant="italic">loss</mml:mtext>
                                <mml:mi>i</mml:mi>
                            </mml:msub>
                            <mml:mo>=</mml:mo>
                            <mml:mrow>
                                <mml:mo stretchy="true">(</mml:mo>
                                <mml:msub>
                                    <mml:mi>y</mml:mi>
                                    <mml:mrow>
                                        <mml:mtext mathvariant="italic">true</mml:mtext>
                                        <mml:mo>,</mml:mo>
                                        <mml:mi>i</mml:mi>
                                    </mml:mrow>
                                </mml:msub>
                                <mml:mo>.</mml:mo>
                                <mml:mo>log</mml:mo>
                                <mml:mrow>
                                    <mml:mo stretchy="true">(</mml:mo>
                                    <mml:msub>
                                        <mml:mi>y</mml:mi>
                                        <mml:mrow>
                                            <mml:mtext mathvariant="italic">pred</mml:mtext>
                                            <mml:mo>,</mml:mo>
                                            <mml:mi>i</mml:mi>
                                        </mml:mrow>
                                    </mml:msub>
                                    <mml:mo>+</mml:mo>
                                    <mml:mi mathvariant="normal">&#x03b5;</mml:mi>
                                    <mml:mo stretchy="true">)</mml:mo>
                                </mml:mrow>
                                <mml:mo>+</mml:mo>
                                <mml:mrow>
                                    <mml:mo stretchy="true">(</mml:mo>
                                    <mml:mn>1</mml:mn>
                                    <mml:mo>&#x2212;</mml:mo>
                                    <mml:msub>
                                        <mml:mi>y</mml:mi>
                                        <mml:mrow>
                                            <mml:mtext mathvariant="italic">true</mml:mtext>
                                            <mml:mo>,</mml:mo>
                                            <mml:mi>i</mml:mi>
                                        </mml:mrow>
                                    </mml:msub>
                                    <mml:mo stretchy="true">)</mml:mo>
                                </mml:mrow>
                                <mml:mo>.</mml:mo>
                                <mml:mo>log</mml:mo>
                                <mml:mrow>
                                    <mml:mo stretchy="true">(</mml:mo>
                                    <mml:mn>1</mml:mn>
                                    <mml:mo>&#x2212;</mml:mo>
                                    <mml:msub>
                                        <mml:mi>y</mml:mi>
                                        <mml:mrow>
                                            <mml:mtext mathvariant="italic">pred</mml:mtext>
                                            <mml:mo>,</mml:mo>
                                            <mml:mi>i</mml:mi>
                                        </mml:mrow>
                                    </mml:msub>
                                    <mml:mo>+</mml:mo>
                                    <mml:mi mathvariant="normal">&#x03b5;</mml:mi>
                                    <mml:mo stretchy="true">)</mml:mo>
                                </mml:mrow>
                                <mml:mo stretchy="true">)</mml:mo>
                            </mml:mrow>
                        </mml:math>

                        <label>(1)</label>
</disp-formula>
                </p>
                <p>A small constant &#x03b5; = 1 X 10
                    <sup>&#x2212;10</sup> is introduced to ensure numerical stability in the logarithmic calculations when the prediction probability approached 0 or 1. Gradient descent helps to iteratively update the weights of the base models by calculating the direction of the steepest descent of the loss function. By minimizing the average loss, which is the average binary cross-entropy across all data points (
                    <xref ref-type="disp-formula" rid="e2">
Equation 2</xref>), gradient descent allows the model to adjust its predictions in a way that maximizes accuracy while balancing the contributions of each base model in the ensemble.
                    <disp-formula id="e2">

                        <mml:math display="block">
                            <mml:mtext mathvariant="italic">loss</mml:mtext>
                            <mml:mo>=</mml:mo>
                            <mml:mfrac>
                                <mml:mn>1</mml:mn>
                                <mml:mi>N</mml:mi>
                            </mml:mfrac>
                            <mml:munderover>
                                <mml:mo>&#x2211;</mml:mo>
                                <mml:mrow>
                                    <mml:mi>i</mml:mi>
                                    <mml:mo>=</mml:mo>
                                    <mml:mn>1</mml:mn>
                                </mml:mrow>
                                <mml:mi>N</mml:mi>
                            </mml:munderover>
                            <mml:msub>
                                <mml:mtext mathvariant="italic">loss</mml:mtext>
                                <mml:mi>i</mml:mi>
                            </mml:msub>
                        </mml:math>

                        <label>(2)</label>
</disp-formula>
                </p>
                <p>
This iterative procedure continues until the loss converges, thereby guaranteeing that the ensemble model is fine-tuned to its optimal performance. The effectiveness of the algorithm also strongly depends on factors such as the learning rate, early stopping (patience), and aggregation strategy via weighted averages. The learning rate is a critical factor in solving the gradient descent optimization to achieve a trade-off between overshooting and slow convergence. Early stopping stops training when the model performance starts to improve to prevent overfitting. The &#x201c;patience&#x201d; parameter control number of iteration algorithm to wait before stopping, hence used to prevent over-fitting. Similarly, while aggregating, we can simply use weighted averaging by weights that best increase the overall predictive power of the model in the ensemble.</p>
            </sec>
            <sec id="sec11">
                <title>Evaluation matrix</title>
                <p>In the context of imbalanced datasets, it is important to look beyond accuracy to comprehensively understand performance. Accuracy measures the correct predictions, but when there are different numbers of records for each class, it could lead to misleading conclusions. Precision centers around the percentage of the positive predictions made by the model that are correct, meaning that it determines how good the model is at not making false positives. Recall, or Sensitivity, measures how well the model identifies true positives among them and might be important when attempting to capture a minority class. The F1-score is the harmonic mean of precision and recall, avoiding either false positives or false negatives that dominate the evaluation. An ROC curve shows the trade-off between true-positive and false-positive rates at various thresholds, which aids in understanding the discriminative ability of a model. The AUC measures the capability of the model to distinguish between positive and negative classes by plotting a line on the ROC curve. Given the imbalanced nature of our datasets, these metrics are crucial for ensuring a more nuanced and reliable assessment of the model performance. The formulas to compute the performance matrices are mentioned in 
                    <xref ref-type="table" rid="T4">
Table 3</xref>.</p>
                <table-wrap id="T4" orientation="portrait" position="float">
                    <label>
Table 3. </label>
                    <caption>
                        <title>Performance matrices and their mathematical notations.</title>
                    </caption>
                    <table content-type="article-table" frame="hsides">
                        <thead>
                            <tr>
                                <th align="left" colspan="1" rowspan="1" valign="top">Performance matric</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">
Mathematical notation</th>
                            </tr>
                        </thead>
                        <tbody>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Accuracy (Acc)</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">

                                    <inline-formula>

                                        <mml:math display="inline">
                                            <mml:mfrac>
                                                <mml:mn>1</mml:mn>
                                                <mml:mi>n</mml:mi>
                                            </mml:mfrac>
                                            <mml:munderover>
                                                <mml:mo>&#x2211;</mml:mo>
                                                <mml:mrow>
                                                    <mml:mi>i</mml:mi>
                                                    <mml:mo>=</mml:mo>
                                                    <mml:mn>1</mml:mn>
                                                </mml:mrow>
                                                <mml:mi>n</mml:mi>
                                            </mml:munderover>
                                            <mml:mn>1</mml:mn>
                                            <mml:mrow>
                                                <mml:mo stretchy="true">(</mml:mo>
                                                <mml:msub>
                                                    <mml:mi>y</mml:mi>
                                                    <mml:mi>i</mml:mi>
                                                </mml:msub>
                                                <mml:mo>=</mml:mo>
                                                <mml:mover accent="true">
                                                    <mml:msub>
                                                        <mml:mi>y</mml:mi>
                                                        <mml:mi>i</mml:mi>
                                                    </mml:msub>
                                                    <mml:mo stretchy="true">&#x0302;</mml:mo>
                                                </mml:mover>
                                                <mml:mo stretchy="true">)</mml:mo>
                                            </mml:mrow>
                                        </mml:math>
</inline-formula>
</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Precision (P)</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">

                                    <inline-formula>

                                        <mml:math display="inline">
                                            <mml:mfrac>
                                                <mml:mrow>
                                                    <mml:munderover>
                                                        <mml:mo>&#x2211;</mml:mo>
                                                        <mml:mrow>
                                                            <mml:mi>i</mml:mi>
                                                            <mml:mo>=</mml:mo>
                                                            <mml:mn>1</mml:mn>
                                                        </mml:mrow>
                                                        <mml:mi>n</mml:mi>
                                                    </mml:munderover>
                                                    <mml:mn>1</mml:mn>
                                                    <mml:mrow>
                                                        <mml:mo stretchy="true">(</mml:mo>
                                                        <mml:msub>
                                                            <mml:mi>y</mml:mi>
                                                            <mml:mi>i</mml:mi>
                                                        </mml:msub>
                                                        <mml:mo>=</mml:mo>
                                                        <mml:mn>1</mml:mn>
                                                        <mml:mspace width="0.25em"/>
                                                        <mml:mi mathvariant="normal">&#x039b;</mml:mi>
                                                        <mml:mspace width="0.25em"/>
                                                        <mml:mover accent="true">
                                                            <mml:msub>
                                                                <mml:mi>y</mml:mi>
                                                                <mml:mi>i</mml:mi>
                                                            </mml:msub>
                                                            <mml:mo stretchy="true">&#x0302;</mml:mo>
                                                        </mml:mover>
                                                        <mml:mo>=</mml:mo>
                                                        <mml:mn>1</mml:mn>
                                                        <mml:mo stretchy="true">)</mml:mo>
                                                    </mml:mrow>
                                                    <mml:mspace width="0.25em"/>
                                                </mml:mrow>
                                                <mml:mrow>
                                                    <mml:munderover>
                                                        <mml:mo>&#x2211;</mml:mo>
                                                        <mml:mrow>
                                                            <mml:mi>i</mml:mi>
                                                            <mml:mo>=</mml:mo>
                                                            <mml:mn>1</mml:mn>
                                                        </mml:mrow>
                                                        <mml:mi>n</mml:mi>
                                                    </mml:munderover>
                                                    <mml:mn>1</mml:mn>
                                                    <mml:mrow>
                                                        <mml:mo stretchy="true">(</mml:mo>
                                                        <mml:mover accent="true">
                                                            <mml:msub>
                                                                <mml:mi>y</mml:mi>
                                                                <mml:mi>i</mml:mi>
                                                            </mml:msub>
                                                            <mml:mo stretchy="true">&#x0302;</mml:mo>
                                                        </mml:mover>
                                                        <mml:mo>=</mml:mo>
                                                        <mml:mn>1</mml:mn>
                                                        <mml:mo stretchy="true">)</mml:mo>
                                                    </mml:mrow>
                                                    <mml:mspace width="0.25em"/>
                                                </mml:mrow>
                                            </mml:mfrac>
                                        </mml:math>
</inline-formula>
</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Recall (R)</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">

                                    <inline-formula>

                                        <mml:math display="inline">
                                            <mml:mfrac>
                                                <mml:mrow>
                                                    <mml:munderover>
                                                        <mml:mo>&#x2211;</mml:mo>
                                                        <mml:mrow>
                                                            <mml:mi>i</mml:mi>
                                                            <mml:mo>=</mml:mo>
                                                            <mml:mn>1</mml:mn>
                                                        </mml:mrow>
                                                        <mml:mi>n</mml:mi>
                                                    </mml:munderover>
                                                    <mml:mn>1</mml:mn>
                                                    <mml:mrow>
                                                        <mml:mo stretchy="true">(</mml:mo>
                                                        <mml:msub>
                                                            <mml:mi>y</mml:mi>
                                                            <mml:mi>i</mml:mi>
                                                        </mml:msub>
                                                        <mml:mo>=</mml:mo>
                                                        <mml:mn>1</mml:mn>
                                                        <mml:mspace width="0.25em"/>
                                                        <mml:mi mathvariant="normal">&#x039b;</mml:mi>
                                                        <mml:mspace width="0.25em"/>
                                                        <mml:mover accent="true">
                                                            <mml:msub>
                                                                <mml:mi>y</mml:mi>
                                                                <mml:mi>i</mml:mi>
                                                            </mml:msub>
                                                            <mml:mo stretchy="true">&#x0302;</mml:mo>
                                                        </mml:mover>
                                                        <mml:mo>=</mml:mo>
                                                        <mml:mn>1</mml:mn>
                                                        <mml:mo stretchy="true">)</mml:mo>
                                                    </mml:mrow>
                                                    <mml:mspace width="0.25em"/>
                                                </mml:mrow>
                                                <mml:mrow>
                                                    <mml:munderover>
                                                        <mml:mo>&#x2211;</mml:mo>
                                                        <mml:mrow>
                                                            <mml:mi>i</mml:mi>
                                                            <mml:mo>=</mml:mo>
                                                            <mml:mn>1</mml:mn>
                                                        </mml:mrow>
                                                        <mml:mi>n</mml:mi>
                                                    </mml:munderover>
                                                    <mml:mn>1</mml:mn>
                                                    <mml:mrow>
                                                        <mml:mo stretchy="true">(</mml:mo>
                                                        <mml:msub>
                                                            <mml:mi>y</mml:mi>
                                                            <mml:mi>i</mml:mi>
                                                        </mml:msub>
                                                        <mml:mo>=</mml:mo>
                                                        <mml:mn>1</mml:mn>
                                                        <mml:mo stretchy="true">)</mml:mo>
                                                    </mml:mrow>
                                                    <mml:mspace width="0.25em"/>
                                                </mml:mrow>
                                            </mml:mfrac>
                                        </mml:math>
</inline-formula>
</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">F1-Score</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">2 x (P x R) / (P + R)</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Area Under Curve (AUC)</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">

                                    <inline-formula>

                                        <mml:math display="inline">
                                            <mml:mi mathvariant="italic">AUC</mml:mi>
                                            <mml:mo>&#x2248;</mml:mo>
                                            <mml:munderover>
                                                <mml:mo>&#x2211;</mml:mo>
                                                <mml:mrow>
                                                    <mml:mi>i</mml:mi>
                                                    <mml:mo>=</mml:mo>
                                                    <mml:mn>1</mml:mn>
                                                </mml:mrow>
                                                <mml:mrow>
                                                    <mml:mi>n</mml:mi>
                                                    <mml:mo>&#x2212;</mml:mo>
                                                    <mml:mn>1</mml:mn>
                                                </mml:mrow>
                                            </mml:munderover>
                                            <mml:mrow>
                                                <mml:mo stretchy="true">(</mml:mo>
                                                <mml:mspace width="0.25em"/>
                                                <mml:msub>
                                                    <mml:mi mathvariant="italic">TPR</mml:mi>
                                                    <mml:mi>i</mml:mi>
                                                </mml:msub>
                                                <mml:mo>+</mml:mo>
                                                <mml:msub>
                                                    <mml:mi mathvariant="italic">TPR</mml:mi>
                                                    <mml:mrow>
                                                        <mml:mi>i</mml:mi>
                                                        <mml:mo>+</mml:mo>
                                                        <mml:mn>1</mml:mn>
                                                    </mml:mrow>
                                                </mml:msub>
                                                <mml:mo stretchy="true">)</mml:mo>
                                            </mml:mrow>
                                            <mml:mo>&#x00d7;</mml:mo>
                                            <mml:mfrac>
                                                <mml:mrow>
                                                    <mml:mo stretchy="true">(</mml:mo>
                                                    <mml:msub>
                                                        <mml:mi mathvariant="italic">FPR</mml:mi>
                                                        <mml:mrow>
                                                            <mml:mi>i</mml:mi>
                                                            <mml:mo>+</mml:mo>
                                                            <mml:mn>1</mml:mn>
                                                        </mml:mrow>
                                                    </mml:msub>
                                                    <mml:mo>&#x2212;</mml:mo>
                                                    <mml:msub>
                                                        <mml:mi mathvariant="italic">FPR</mml:mi>
                                                        <mml:mi>i</mml:mi>
                                                    </mml:msub>
                                                    <mml:mo stretchy="true">)</mml:mo>
                                                </mml:mrow>
                                                <mml:mn>2</mml:mn>
                                            </mml:mfrac>
                                        </mml:math>
</inline-formula>
</td>
                            </tr>
                        </tbody>
                    </table>
                    <table-wrap-foot>
                        <p>Note: Where n is the total number of observations in the dataset and y
                            <sub>i</sub> and 
                            <inline-formula>

                                <mml:math display="inline">
                                    <mml:mover accent="true">
                                        <mml:msub>
                                            <mml:mi>y</mml:mi>
                                            <mml:mi>i</mml:mi>
                                        </mml:msub>
                                        <mml:mo stretchy="true">&#x0302;</mml:mo>
                                    </mml:mover>
                                </mml:math>
</inline-formula> are the true and false labels for the i
                            <sup>th</sup> sample, respectively.</p>
                    </table-wrap-foot>
                </table-wrap>
            </sec>
        </sec>
        <sec id="sec12">
            <title>Experimental results</title>
            <p>The experimental results of our ensemble model are presented in this section, and an in-depth analysis of its performance over several datasets is carried out. The effectiveness of GBWOEM is evaluated by both the variant GBWOEM-R (random initialization) and GBWOEM-U (uniform initialization) on five datasets with various dimensionalities and characters. Given the diversity of base models used in the ensemble: LR, DT, KNN, RF, and MLP, we methodically assessed combinations of two, three, four, and all five base models. We quantified the quality of these results using standard metrics and drew particular attention to how different weight initialization strategies affect the generalizability of an ensemble across datasets with different dimensionalities.</p>
            <sec id="sec13">
                <title>Breast cancer dataset</title>
                <p>This dataset has 369 entries, which has 31 features altogether derived from FNA images of breast tumors, with diagnosis as the target variable. A performance analysis of both variants of GBWOEM is presented in 
                    <xref ref-type="fig" rid="f3">
Figure 3</xref>. In GBWOEM-R, the LR (0.058) and RFC (1.002) pairs achieve the highest test accuracy and AUC values, where RFC having a significantly higher weight, indicating its stronger contribution. In GBWOEM-U, although the LR (0.5) and DTC (0.505) pair gave the highest accuracy when we considered both accuracy and AUC, the LR (0.5) and MLP (0.501) pair performs best. For both pairs, the weights of the base models are almost equal, suggesting a more balanced contribution from each base model. Pairs such as (LR, DTC), (LR, RFC), and (LR, KNN) are performing consistently across both variants, underlining their robustness. However, in both the models, increasing the number of base models led to overfitting, increases the training accuracy to 100%, but reduction in the test accuracy. This highlights the importance of careful base model selection and weight optimization to avoid overfitting when scaling up the ensemble.</p>
                <fig fig-type="figure" id="f3" orientation="portrait" position="float">
                    <label>
Figure 3. </label>
                    <caption>
                        <title>Performance matrices of GBWOEM (R&amp;U) on Breast Cancer Dataset.</title>
                    </caption>
                    <graphic id="gr3" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/195371/744c354a-e679-40bb-80ed-d5612f6ac413_figure3.gif"/>
                </fig>
            </sec>
            <sec id="sec14">
                <title>Pima Indians diabetes database</title>
                <p>This is a common dataset utilized for research on diabetes and machine learning, which contains eight medical predictor variables, one target variable, and 768 entries. After data pre-processing, it is noticed that some columns have invalid 0&#x2019;s, which are replaced with the min or median of those columns. The performances of both variants of our proposed ensemble model are presented in 
                    <xref ref-type="fig" rid="f4">
Figure 4</xref>. In GBWOEN-R, the (LR, RFC) (0.695, 1.0) and (DTC, RFC, KNN, MLP) (0.102, 0.727, 0.145, 0.027) pairs showed the highest accuracy, but (LR, RFC) achieved a higher AUC with RFC having the highest weights and more contribution to the final ensemble result. In GBWOEM-U, the combination of all five base models yielded the highest accuracy but a low AUC value. Again, (LR, RFC) (0.521, 1.102) achieves a balanced accuracy and AUC, with RFC dominating.</p>
                <fig fig-type="figure" id="f4" orientation="portrait" position="float">
                    <label>
Figure 4. </label>
                    <caption>
                        <title>Performance matrices of GBWOEM (R&amp;U) on Pima Indians Diabetes Database.</title>
                    </caption>
                    <graphic id="gr4" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/195371/744c354a-e679-40bb-80ed-d5612f6ac413_figure4.gif"/>
                </fig>
            </sec>
            <sec id="sec15">
                <title>Diabetic Retinopathy Debrecen Database</title>
                <p>The Diabetic Retinopathy Debrecen Database, comprising 1,151 instances and 19 features, helps predict diabetic retinopathy using image-driven features. The performances of GBWOEM-R and GBWOEM-U are represented in 
                    <xref ref-type="fig" rid="f5">
Figure 5</xref>. In GBWOEM-R, (LR, MLP) (0.877, 0.542), (LR, RFC, MLP) (0.341, 0.433, 0.346), and (LR, KNN, MLP) (0.322, 0.25, 0.515) achieved the highest accuracy, whereas (LR, KNN, MLP) had the best AUC. From the final weight of each base model, it can be concluded that all models contribute significantly to the final result. The GBWOEM-U variant achieved slightly higher accuracy than GBWOEM-R, but had a lower AUC value. In this variant, (KNN, MLP) (0.501, 0.501) showed higher accuracy, where each model contributed equally. However, as per the AUC concern, the (LR, KNN, MLP) pair provides balanced results for both variants.</p>
                <fig fig-type="figure" id="f5" orientation="portrait" position="float">
                    <label>
Figure 5. </label>
                    <caption>
                        <title>Performance matrices of GBWOEM (R&amp;U) on Diabetic Retinopathy Database.</title>
                    </caption>
                    <graphic id="gr5" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/195371/744c354a-e679-40bb-80ed-d5612f6ac413_figure5.gif"/>
                </fig>
            </sec>
            <sec id="sec16">
                <title>Obesity database</title>
                <p>This dataset includes 2,111 instances and 17 features related to lifestyle and dietary habits. The target column is divided into different classes, including normal weight, underweight, overweight, and obese (I, II, and III). For our experiment, we reclassified the target variable into binary classes, classifying all obesity levels as class 1 and other classes as 0 because the goal is to detect obesity. The performance analyses of GBWOEM-R and GBWOEM-U on this dataset are represented in 
                    <xref ref-type="fig" rid="f6">
Figure 6</xref>.</p>
                <fig fig-type="figure" id="f6" orientation="portrait" position="float">
                    <label>
Figure 6. </label>
                    <caption>
                        <title>Performance matrices of GBWOEM (R&amp;U) on Obesity Database.</title>
                    </caption>
                    <graphic id="gr6" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/195371/744c354a-e679-40bb-80ed-d5612f6ac413_figure6.gif"/>
                </fig>
                <p>Both variants performed exceptionally well, with accuracy and AUC values reaching or exceeding 99% across all combinations. In all GBWOEM-U pairs, weights are evenly distributed with minimal adjustment. Pair-like (LR, DTC), (LR, KNN), and (LR, RFC) algorithms continue to perform well, consistent with their performance across other datasets. For this dataset, the higher-order combinations (e.g., 5C3-5C5) perform well in the testing phase, and the training-testing accuracy gap is minimal, suggesting better generalization, possibly due to the nature of the attributes or the binary classification approach we employed.</p>
            </sec>
            <sec id="sec17">
                <title>Thyroid disease</title>
                <p>Hypothyroid Disease includes 3,711 entries and 30 features for the detection of hypothyroidism. Both the variants GBWOEM-R and GBOWEM-U are performing well, where almost all the pairs are achieving accuracy over 93% and AUC over 96%, as presented in 
                    <xref ref-type="fig" rid="f7">
Figure 7</xref>. Similar to the Obesity dataset, the difference between the training and testing results is minimal, and higher-order combinations also perform well, likely resulting in a large sample size in both datasets. In GBWOEM-R, models such as DTC and RFC contribute more to their corresponding pairs with respect to other models. In GBWOEM-U, almost all base models have equal weights in their respective pairs and require minimal weight correction during optimization. This balance suggests a uniform contribution from all models, which may contribute to strong performance across multiple metrics.</p>
                <fig fig-type="figure" id="f7" orientation="portrait" position="float">
                    <label>
Figure 7. </label>
                    <caption>
                        <title>Performance matrices of GBWOEM (R&amp;U) on Thyroid Disease.</title>
                    </caption>
                    <graphic id="gr7" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/195371/744c354a-e679-40bb-80ed-d5612f6ac413_figure7.gif"/>
                </fig>
            </sec>
            <sec id="sec18">
                <title>Comparison with existing ensemble model</title>
                <p>This section of the Results and Discussion section shows a comparison between GBWOEM and other existing ensemble models: Adaboost, Catboost, GradientBoost, LightGBM, and XGBoost. This will help us establish the potential benefits of our method in terms of precision, AUC, and generalization capability. Our model led to the enhancement of test accuracy compared to existing ensemble models, with improvements between 0.48% and 8.26% across all five datasets. The specific accuracy gains for each dataset were as follows: Breast Cancer (5.32%), Pima Indians Diabetes Database (2.60%), Diabetic Retinopathy Debrecen (8.26%), Obesity Level estimation based on physical condition and eating habits (0.48%), and Thyroid Disease (2.32%). Although these values differ in the amount of improvement they contribute, this highlights that one of the great features of GBWOEM is that it is capable of handling various datasets and tasks efficiently.</p>
                <p>A comprehensive comparative quantitative performance for the details is given in 
                    <xref ref-type="table" rid="T5">
Table 4</xref> between the training and test accuracies of both the GBWOEM and existing models. In addition, ROC curves were drawn for each dataset for these five ensemble models and two variants of GBWOEM (GBWOEM-R and GBWOEM-U). It is very useful in the case of imbalanced datasets and helps us better understand how the model separates classes. From 
                    <xref ref-type="fig" rid="f9">
Figure 9</xref>, we can see that both variants of the proposed GBWOEM are able to distinguish between classes well for all datasets except PID DS. The models shows comparable results (80-90%) for performance matrices like precision, recall and F1-score, which rules out overfitting and is evident in 
                    <xref ref-type="fig" rid="f3">
Figures 3</xref>, 
                    <xref ref-type="fig" rid="f6">6</xref>, and 
                    <xref ref-type="fig" rid="f7">7</xref>. A bar chart (
                    <xref ref-type="fig" rid="f8">
Figure 8</xref>) is also included to show the training and test accuracies of the baseline models vs. our additionally proposed GBWOEM variants to graphically display these differences in our model accuracy.</p>
                <table-wrap id="T5" orientation="portrait" position="float">
                    <label>
Table 4. </label>
                    <caption>
                        <title>Test accuracy and test AUC comparison between GBWOEM and existing ensemble models.</title>
                    </caption>
                    <table content-type="article-table" frame="hsides">
                        <thead>
                            <tr>
                                <th align="left" colspan="1" rowspan="2" valign="top">
Dataset</th>
                                <th align="left" colspan="6" rowspan="1" valign="top">Test accuracy</th>
                                <th align="left" colspan="6" rowspan="1" valign="top">Test AUC</th>
                            </tr>
                            <tr>
                                <th align="left" colspan="1" rowspan="1" valign="top">
AB</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">
CB</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">
GB</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">
LGBM</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">
XGB</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">
GBWOEM</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">
AB</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">
CB</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">
GB</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">
LGBM</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">
XGB</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">
GBWOEM</th>
                            </tr>
                        </thead>
                        <tbody>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="middle">BC DS</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">70.43</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">69.57</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">71.74</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">62.61</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">74.68</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">80</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">70.38</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">69.98</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">72.14</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">61.41</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">69.85</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">89.65</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="middle">PID DS</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">75.32</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">71.43</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">74.68</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">74.03</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">74.68</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">77.92</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">71.2</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">67.35</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">70.28</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">69.78</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">69.85</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">83.69</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="middle">DRD DS</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">70.43</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">70.43</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">69.57</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">71.74</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">62.61</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">80</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">71.12</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">70.38</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">69.98</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">72.14</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">61.41</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">89.65</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="middle">OL DS</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">99.28</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">99.52</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">99.28</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">99.52</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">99.52</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">100</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">99.26</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">99.49</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">99.26</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">99.49</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">99.49</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">100</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="middle">TH DS</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">95.79</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">94.73</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">95.54</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">95.79</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">94.79</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">98.11</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">82.35</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">87.11</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">85.94</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">82.35</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">84.47</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">99.74</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
                <fig fig-type="figure" id="f8" orientation="portrait" position="float">
                    <label>
Figure 8. </label>
                    <caption>
                        <title>Comparison of training and testing accuracy between existing and proposed ensemble model for all the datasets.</title>
                    </caption>
                    <graphic id="gr8" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/195371/744c354a-e679-40bb-80ed-d5612f6ac413_figure8.gif"/>
                </fig>
                <fig fig-type="figure" id="f9" orientation="portrait" position="float">
                    <label>
Figure 9. </label>
                    <caption>
                        <title>ROC Plot of existing and proposed GBWOEM (R&amp;U) model (a) BC DS, (b) PID DS, (c) DRD DS, (d) OL DS and (e) TH DS.</title>
                    </caption>
                    <graphic id="gr9" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/195371/744c354a-e679-40bb-80ed-d5612f6ac413_figure9.gif"/>
                </fig>
            </sec>
        </sec>
        <sec id="sec19">
            <title>Conclusion and future work</title>
            <p>In this study, we proposed the Gradient-Based Weight Optimized Ensemble Model (GBWOEM) consisting two variants, GBWOEM-R (random initialization) and GBWOEM-U (uniform initialization), designed to improve classification performance by dynamic weight optimisation for LR, DTC, KNN, RFC and MLP base models. Using the weighted average approach, the model&#x2019;s weights are treated as real-valued variables optimized using gradient descent. The model was evaluated on five diverse datasets: Breast Cancer, Pima Indians Diabetes Database, Diabetic Retinopathy Debrecen, Obesity Level estimation based on physical condition and eating habits, and Thyroid Disease, each with unique characteristics and dimensions. In the end, we observed significant improvements in test accuracy across all datasets, with a gain of 0.48% to 8.26%, as compared to existing ensemble models, namely Adaboost, Catboost, GradientBoost, LightGBM, and XGBoost. GBWOEM achieved its highest increase in accuracy on the Diabetic Retinopathy Debrecen dataset, suggesting that GBOWOEM effectively addresses complex, feature-rich datasets. While both GBWOEM variants showed similar functional behaviour, GBWOEM-R favoured certain based models like RFC due to uneven weight distribution, but GBWOEM-U showed even distribution of weights and delivered more balanced and stable results across the dataset. In addition, the ROC curves and AUC values confirmed GBWOEM&#x2019;s robustness of GBWOEM on various datasets. Surprisingly, increasing the number of base models contextually increases the training accuracy (up 100% in some cases) but not test performance, emphasizing the risk of overfitting in ensemble models. The dynamic weight optimization of the GBWOEM was shown to be a key strength, allowing flexibility across datasets with different dimensions and class distributions. Future work aims to incorporate advanced weight optimization techniques, such as adaptive learning rates or metaheuristic approaches, and test the model in multi-class and large-scale datasets for broader validation while maintaining lower computational complexity.</p>
        </sec>
    </body>
    <back>
        <sec id="sec22" sec-type="data-availability">
            <title>Data availability</title>
            <p>The datasets used in this research are publicly available and can be accessed through the following DOIs:
                <list list-type="bullet">
                    <list-item>
                        <label>&#x2022;</label>
                        <p>Diabetic Retinopathy Debrecen (
                            <ext-link ext-link-type="uri" xlink:href="https://archive.ics.uci.edu/dataset/329/diabetic+retinopathy+debrecen">https://archive.ics.uci.edu/dataset/329/diabetic+retinopathy+debrecen</ext-link>; doi:10.24432/C5XP4P),</p>
                    </list-item>
                    <list-item>
                        <label>&#x2022;</label>
                        <p>Estimation of Obesity Levels Based On Eating Habits and Physical Condition (
                            <ext-link ext-link-type="uri" xlink:href="https://archive.ics.uci.edu/dataset/544/estimation+of+obesity+levels+based+on+eating+habits+and+physical+condition">https://archive.ics.uci.edu/dataset/544/estimation+of+obesity+levels+based+on+eating+habits+and+physical+condition</ext-link>; doi:10.24432/C5H31Z),</p>
                    </list-item>
                    <list-item>
                        <label>&#x2022;</label>
                        <p>Thyroid Disease (
                            <ext-link ext-link-type="uri" xlink:href="https://archive.ics.uci.edu/dataset/102/thyroid+disease">https://archive.ics.uci.edu/dataset/102/thyroid+disease</ext-link>; doi:10.24432/C5D010).</p>
                    </list-item>
                    <list-item>
                        <label>&#x2022;</label>
                        <p>The Pima Indians Diabetes Dataset, originally hosted on UCI ML Repository is no longer available there. However, it can be accessed via Kaggle at 
                            <ext-link ext-link-type="uri" xlink:href="https://www.kaggle.com/datasets/uciml/pima-indians-diabetes-database">https://www.kaggle.com/datasets/uciml/pima-indians-diabetes-database
</ext-link>.</p>
                    </list-item>
                </list>
            </p>
        </sec>
        <ref-list>
            <title>References</title>
            <ref id="ref1">
                <label>1</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Mahajan</surname>
                            <given-names>P</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Uddin</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Hajati</surname>
                            <given-names>F</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Ensemble Learning for Disease Prediction: A Review.</article-title>
                    <source>

                        <italic toggle="yes">Healthcare.</italic>
</source>
                    <year>Jun. 2023</year>;<volume>11</volume>(<issue>12</issue>):<fpage>1808</fpage>.
                    <pub-id pub-id-type="pmid">37372925</pub-id>
                    <pub-id pub-id-type="doi">10.3390/healthcare11121808</pub-id>
                    <pub-id pub-id-type="pmcid">PMC10298658</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref2">
                <label>2</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Wazid</surname>
                            <given-names>M</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Singh</surname>
                            <given-names>J</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Das</surname>
                            <given-names>AK</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>An Ensemble-Based Machine Learning-Envisioned Intrusion Detection in Industry 5.0-Driven Healthcare Applications.</article-title>
                    <source>

                        <italic toggle="yes">IEEE Trans. Consum. Electron.</italic>
</source>
                    <year>Feb. 2024</year>;<volume>70</volume>(<issue>1</issue>):<fpage>1903</fpage>&#x2013;<lpage>1912</lpage>.
                    <pub-id pub-id-type="doi">10.1109/TCE.2023.3318850</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref3">
                <label>3</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Abidi</surname>
                            <given-names>MH</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Umer</surname>
                            <given-names>U</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Mian</surname>
                            <given-names>SH</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Big Data-Based Smart Health Monitoring System: Using Deep Ensemble Learning.</article-title>
                    <source>

                        <italic toggle="yes">IEEE Access.</italic>
</source>
                    <year>2023</year>;<volume>11</volume>:<fpage>114880</fpage>&#x2013;<lpage>114903</lpage>.
                    <pub-id pub-id-type="doi">10.1109/ACCESS.2023.3325323</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref4">
                <label>4</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Liu</surname>
                            <given-names>C-L</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>A bagging approach for improved predictive accuracy of intradialytic hypotension during hemodialysis treatment.</article-title>
                    <source>

                        <italic toggle="yes">Comput. Biol. Med.</italic>
</source>
                    <year>Apr. 2024</year>;<volume>172</volume>:<fpage>108244</fpage>.
                    <pub-id pub-id-type="pmid">38457931</pub-id>
                    <pub-id pub-id-type="doi">10.1016/j.compbiomed.2024.108244</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref5">
                <label>5</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Yin</surname>
                            <given-names>H</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Predicting the climate impact of healthcare facilities using gradient boosting machines.</article-title>
                    <source>

                        <italic toggle="yes">Cleaner Environmental Systems.</italic>
</source>
                    <year>Mar. 2024</year>;<volume>12</volume>:<fpage>100155</fpage>.
                    <pub-id pub-id-type="pmid">38444563</pub-id>
                    <pub-id pub-id-type="doi">10.1016/j.cesys.2023.100155</pub-id>
                    <pub-id pub-id-type="pmcid">PMC10909736</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref6">
                <label>6</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Rehman</surname>
                            <given-names>A</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Mujahid</surname>
                            <given-names>M</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Saba</surname>
                            <given-names>T</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Optimised stacked machine learning algorithms for genomics and genetics disorder detection in the healthcare industry.</article-title>
                    <source>

                        <italic toggle="yes">Funct. Integr. Genomics.</italic>
</source>
                    <year>Feb. 2024</year>;<volume>24</volume>(<issue>1</issue>):<fpage>23</fpage>.
                    <pub-id pub-id-type="pmid">38305949</pub-id>
                    <pub-id pub-id-type="doi">10.1007/s10142-024-01289-z</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref7">
                <label>7</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Das</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Nayak</surname>
                            <given-names>SP</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Sahoo</surname>
                            <given-names>B</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Machine Learning in Healthcare Analytics: A State-of-the-Art Review.</article-title>
                    <source>

                        <italic toggle="yes">Archives of Computational Methods in Engineering.</italic>
</source>
                    <year>Apr. 2024</year>.
                    <pub-id pub-id-type="doi">10.1007/s11831-024-10098-3</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref8">
                <label>8</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Younas</surname>
                            <given-names>F</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Usman</surname>
                            <given-names>M</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Yan</surname>
                            <given-names>WQ</given-names>
                        </name>
</person-group>:
                    <article-title>A deep ensemble learning method for colorectal polyp classification with optimized network parameters.</article-title>
                    <source>

                        <italic toggle="yes">Appl. Intell.</italic>
</source>
                    <year>2023</year>;<volume>53</volume>(<issue>2</issue>):<fpage>2410</fpage>&#x2013;<lpage>2433</lpage>.
                    <pub-id pub-id-type="doi">10.1007/s10489-022-03689-9</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref9">
                <label>9</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Bhuiyan</surname>
                            <given-names>M</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Islam</surname>
                            <given-names>MS</given-names>
                        </name>
</person-group>:
                    <article-title>A new ensemble learning approach to detect malaria from microscopic red blood cell images.</article-title>
                    <source>

                        <italic toggle="yes">Sensors International.</italic>
</source>
                    <year>2023</year>;<volume>4</volume>(<issue>August 2022</issue>):<fpage>100209</fpage>.
                    <pub-id pub-id-type="doi">10.1016/j.sintl.2022.100209</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref10">
                <label>10</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Marques</surname>
                            <given-names>G</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Ferreras</surname>
                            <given-names>A</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Torre-Diez</surname>
                            <given-names>I</given-names>
                            <prefix>de la</prefix>
                        </name>
</person-group>:
                    <article-title>An ensemble-based approach for automated medical diagnosis of malaria using EfficientNet.</article-title>
                    <source>

                        <italic toggle="yes">Multimed. Tools Appl.</italic>
</source>
                    <year>2022</year>;<volume>81</volume>(<issue>19</issue>):<fpage>28061</fpage>&#x2013;<lpage>28078</lpage>.
                    <pub-id pub-id-type="pmid">35368860</pub-id>
                    <pub-id pub-id-type="doi">10.1007/s11042-022-12624-6</pub-id>
                    <pub-id pub-id-type="pmcid">PMC8964254</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref11">
                <label>11</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Ali</surname>
                            <given-names>F</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>A smart healthcare monitoring system for heart disease prediction based on ensemble deep learning and feature fusion.</article-title>
                    <source>

                        <italic toggle="yes">Information Fusion.</italic>
</source>
                    <year>2020</year>;<volume>63</volume>:<fpage>208</fpage>&#x2013;<lpage>222</lpage>.
                    <pub-id pub-id-type="doi">10.1016/j.inffus.2020.06.008</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref12">
                <label>12</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Dutta</surname>
                            <given-names>A</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Early Prediction of Diabetes Using an Ensemble of Machine Learning Models.</article-title>
                    <source>

                        <italic toggle="yes">Int. J. Environ. Res. Public Health.</italic>
</source>
                    <year>2022</year>;<volume>19</volume>(<issue>19</issue>):<fpage>1</fpage>&#x2013;<lpage>25</lpage>.
                    <pub-id pub-id-type="pmid">36231678</pub-id>
                    <pub-id pub-id-type="doi">10.3390/ijerph191912378</pub-id>
                    <pub-id pub-id-type="pmcid">PMC9566114</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref13">
                <label>13</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Ihnaini</surname>
                            <given-names>B</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>A Smart Healthcare Recommendation System for Multidisciplinary Diabetes Patients with Data Fusion Based on Deep Ensemble Learning.</article-title>
                    <source>

                        <italic toggle="yes">Comput. Intell. Neurosci.</italic>
</source>
                    <year>2021</year>;<volume>2021</volume>.
                    <pub-id pub-id-type="pmid">34567101</pub-id>
                    <pub-id pub-id-type="doi">10.1155/2021/4243700</pub-id>
                    <pub-id pub-id-type="pmcid">PMC8463188</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref14">
                <label>14</label>
                <mixed-citation publication-type="other">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Reddy</surname>
                            <given-names>GT</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <chapter-title>An Ensemble based Machine Learning model for Diabetic Retinopathy Classification.</chapter-title>
                    <source>

                        <italic toggle="yes">International Conference on Emerging Trends in Information Technology and Engineering, ic-ETITE 2020.</italic>
</source>
                    <year>2020</year>; pp.<fpage>1</fpage>&#x2013;<lpage>6</lpage>.
                    <pub-id pub-id-type="doi">10.1109/ic-ETITE47903.2020.235</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref15">
                <label>15</label>
                <mixed-citation publication-type="other">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Bin Habib</surname>
                            <given-names>AZS</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Tasnim</surname>
                            <given-names>T</given-names>
                        </name>
</person-group>:
                    <chapter-title>An Ensemble Hard Voting Model for Cardiovascular Disease Prediction.</chapter-title>
                    <source>

                        <italic toggle="yes">2020 2nd International Conference on Sustainable Technologies for Industry 4.0, STI 2020.</italic>
</source>
                    <year>2020</year>; pp.<fpage>19</fpage>&#x2013;<lpage>20</lpage>.
                    <pub-id pub-id-type="doi">10.1109/STI50764.2020.9350514</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref16">
                <label>16</label>
                <mixed-citation publication-type="other">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Amin</surname>
                            <given-names>A</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Hasan</surname>
                            <given-names>K</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Zein-Sabatto</surname>
                            <given-names>S</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <chapter-title>An Explainable AI Framework for Artificial Intelligence of Medical Things.</chapter-title>
                    <source>

                        <italic toggle="yes">2023 IEEE Globecom Workshops, GC Wkshps 2023.</italic>
</source>
                    <year>2023</year>; pp.<fpage>2097</fpage>&#x2013;<lpage>2102</lpage>.
                    <pub-id pub-id-type="doi">10.1109/GCWkshps58843.2023.10464798</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref17">
                <label>17</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>El-Sappagh</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Ali</surname>
                            <given-names>F</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Abuhmed</surname>
                            <given-names>T</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Automatic detection of Alzheimer&#x2019;s disease progression: An efficient information fusion approach with heterogeneous ensemble classifiers.</article-title>
                    <source>

                        <italic toggle="yes">Neurocomputing.</italic>
</source>
                    <year>2022</year>;<volume>512</volume>:<fpage>203</fpage>&#x2013;<lpage>224</lpage>.
                    <pub-id pub-id-type="doi">10.1016/j.neucom.2022.09.009</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref18">
                <label>18</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Borba De Souza</surname>
                            <given-names>V</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Campos Nobre</surname>
                            <given-names>J</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Becker</surname>
                            <given-names>K</given-names>
                        </name>
</person-group>:
                    <article-title>DAC Stacking: A Deep Learning Ensemble to Classify Anxiety, Depression, and Their Comorbidity From Reddit Texts.</article-title>
                    <source>

                        <italic toggle="yes">IEEE J. Biomed. Health Inform.</italic>
</source>
                    <year>2022</year>;<volume>26</volume>(<issue>7</issue>):<fpage>3303</fpage>&#x2013;<lpage>3311</lpage>.
                    <pub-id pub-id-type="pmid">35230959</pub-id>
                    <pub-id pub-id-type="doi">10.1109/JBHI.2022.3151589</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref19">
                <label>19</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Osamor</surname>
                            <given-names>VC</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Okezie</surname>
                            <given-names>AF</given-names>
                        </name>
</person-group>:
                    <article-title>Enhancing the weighted voting ensemble algorithm for tuberculosis predictive diagnosis.</article-title>
                    <source>

                        <italic toggle="yes">Sci. Rep.</italic>
</source>
                    <year>2021</year>;<volume>11</volume>(<issue>1</issue>):<fpage>14806</fpage>&#x2013;<lpage>14811</lpage>.
                    <pub-id pub-id-type="pmid">34285324</pub-id>
                    <pub-id pub-id-type="doi">10.1038/s41598-021-94347-6</pub-id>
                    <pub-id pub-id-type="pmcid">PMC8292494</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref20">
                <label>20</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Subashchandrabose</surname>
                            <given-names>U</given-names>
                        </name>

                        <name name-style="western">
                            <surname>John</surname>
                            <given-names>R</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Anbazhagu</surname>
                            <given-names>UV</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Ensemble Federated Learning Approach for Diagnostics of Multi-Order Lung Cancer.</article-title>
                    <source>

                        <italic toggle="yes">Diagnostics.</italic>
</source>
                    <year>2023</year>;<volume>13</volume>(<issue>19</issue>):<fpage>1</fpage>&#x2013;<lpage>14</lpage>.
                    <pub-id pub-id-type="pmid">37835796</pub-id>
                    <pub-id pub-id-type="doi">10.3390/diagnostics13193053</pub-id>
                    <pub-id pub-id-type="pmcid">PMC10572651</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref21">
                <label>21</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Abbas</surname>
                            <given-names>S</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Fused Weighted Federated Deep Extreme Machine Learning Based on Intelligent Lung Cancer Disease Prediction Model for Healthcare 5.0.</article-title>
                    <source>

                        <italic toggle="yes">Int. J. Intell. Syst.</italic>
</source>
                    <year>2023</year>;<volume>2023</volume>.
                    <pub-id pub-id-type="doi">10.1155/2023/2599161</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref22">
                <label>22</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Kotei</surname>
                            <given-names>E</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Thirunavukarasu</surname>
                            <given-names>R</given-names>
                        </name>
</person-group>:
                    <article-title>Ensemble Technique Coupled with Deep Transfer Learning Framework for Automatic Detection of Tuberculosis from Chest X-ray Radiographs.</article-title>
                    <source>

                        <italic toggle="yes">Healthcare (Switzerland).</italic>
</source>
                    <year>2022</year>;<volume>10</volume>(<issue>11</issue>).
                    <pub-id pub-id-type="doi">10.3390/healthcare10112335</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref23">
                <label>23</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Prakash</surname>
                            <given-names>EP</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Implementation of Artificial Neural Network to Predict Diabetes with High-Quality Health System.</article-title>
                    <source>

                        <italic toggle="yes">Comput. Intell. Neurosci.</italic>
</source>
                    <year>2022</year>;<volume>2022</volume>:<fpage>1</fpage>&#x2013;<lpage>7</lpage>.
                    <pub-id pub-id-type="pmid">35676959</pub-id>
                    <pub-id pub-id-type="doi">10.1155/2022/1174173</pub-id>
                    <pub-id pub-id-type="pmcid">PMC9170457</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref24">
                <label>24</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>El-Rashidy</surname>
                            <given-names>N</given-names>
                        </name>

                        <name name-style="western">
                            <surname>El-Sappagh</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Abuhmed</surname>
                            <given-names>T</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Intensive Care Unit Mortality Prediction: An Improved Patient-Specific Stacking Ensemble Model.</article-title>
                    <source>

                        <italic toggle="yes">IEEE Access.</italic>
</source>
                    <year>2020</year>;<volume>8</volume>:<fpage>133541</fpage>&#x2013;<lpage>133564</lpage>.
                    <pub-id pub-id-type="doi">10.1109/ACCESS.2020.3010556</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref25">
                <label>25</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Rajaraman</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Siegelman</surname>
                            <given-names>J</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Alderson</surname>
                            <given-names>PO</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Iteratively Pruned Deep Learning Ensembles for COVID-19 Detection in Chest X-Rays.</article-title>
                    <source>

                        <italic toggle="yes">IEEE Access.</italic>
</source>
                    <year>2020</year>;<volume>8</volume>:<fpage>115041</fpage>&#x2013;<lpage>115050</lpage>.
                    <pub-id pub-id-type="pmid">32742893</pub-id>
                    <pub-id pub-id-type="doi">10.1109/ACCESS.2020.3003810</pub-id>
                    <pub-id pub-id-type="pmcid">PMC7394290</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref26">
                <label>26</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Rajaraman</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Antani</surname>
                            <given-names>SK</given-names>
                        </name>
</person-group>:
                    <article-title>Modality-Specific Deep Learning Model Ensembles Toward Improving TB Detection in Chest Radiographs.</article-title>
                    <source>

                        <italic toggle="yes">IEEE Access.</italic>
</source>
                    <year>2020</year>;<volume>8</volume>:<fpage>27318</fpage>&#x2013;<lpage>27326</lpage>.
                    <pub-id pub-id-type="doi">10.1109/ACCESS.2020.2971257</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref27">
                <label>27</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Juraev</surname>
                            <given-names>F</given-names>
                        </name>

                        <name name-style="western">
                            <surname>El-Sappagh</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Abdukhamidov</surname>
                            <given-names>E</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Multilayer dynamic ensemble model for intensive care unit mortality prediction of neonate patients.</article-title>
                    <source>

                        <italic toggle="yes">J. Biomed. Inform.</italic>
</source>
                    <year>2022</year>;<volume>135</volume>(<issue>October</issue>):<fpage>104216</fpage>.
                    <pub-id pub-id-type="pmid">36208833</pub-id>
                    <pub-id pub-id-type="doi">10.1016/j.jbi.2022.104216</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref28">
                <label>28</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Anand</surname>
                            <given-names>V</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Weighted Average Ensemble Deep Learning Model for Stratification of Brain Tumor in MRI Images.</article-title>
                    <source>

                        <italic toggle="yes">Diagnostics.</italic>
</source>
                    <year>2023</year>;<volume>13</volume>(<issue>7</issue>).
                    <pub-id pub-id-type="pmid">37046538</pub-id>
                    <pub-id pub-id-type="doi">10.3390/diagnostics13071320</pub-id>
                    <pub-id pub-id-type="pmcid">PMC10093740</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref30">
                <label>29</label>
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Wolberg</surname>
                            <given-names>W</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Mangasarian</surname>
                            <given-names>O</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Street</surname>
                            <given-names>N</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <source>

                        <italic toggle="yes">Breast Cancer Wisconsin (Diagnostic).</italic>
</source>
                    <publisher-name>UCI Machine Learning Repository</publisher-name>.
                    <pub-id pub-id-type="doi">10.24432/C5DW2B</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref31">
                <label>30</label>
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Antal</surname>
                            <given-names>A</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Balint</surname>
                        </name>

                        <name name-style="western">
                            <surname>Hajdu</surname>
                        </name>
</person-group>:
                    <source>

                        <italic toggle="yes">Diabetic Retinopathy Debrecen.</italic>
</source>
                    <publisher-name>UCI Machine Learning Repository</publisher-name>.
                    <pub-id pub-id-type="doi">10.24432/C5XP4P</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref32">
                <label>31</label>
                <mixed-citation publication-type="other">
                    <collab>UCI MACHINE LEARNING</collab>:
                    <article-title>Pima Indians Diabetes Database.</article-title>
                    <source>

                        <italic toggle="yes">Version 1.</italic>
</source>
                    <ext-link ext-link-type="uri" xlink:href="https://www.kaggle.com/datasets/uciml/pima-indians-diabetes-database">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref33">
                <label>32</label>
                <mixed-citation publication-type="book">
                    <source>

                        <italic toggle="yes">Estimation of Obesity Levels Based On Eating Habits and Physical Condition.</italic>
</source>
                    <publisher-name>UCI Machine Learning Repository</publisher-name>.
                    <pub-id pub-id-type="doi">10.24432/C5H31Z</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref34">
                <label>33</label>
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Quinlan</surname>
                            <given-names>R</given-names>
                        </name>
</person-group>:
                    <source>

                        <italic toggle="yes">Thyroid Disease.</italic>
</source>
                    <publisher-name>UCI Machine Learning Repository</publisher-name>.
                    <pub-id pub-id-type="doi">10.24432/C5D010</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref35">
                <label>34</label>
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>MurtiRawat</surname>
                            <given-names>R</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Panchal</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Singh</surname>
                            <given-names>VK</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <chapter-title>Breast Cancer Detection Using K-Nearest Neighbors, Logistic Regression and Ensemble Learning.</chapter-title>
                    <source>

                        <italic toggle="yes">2020 International Conference on Electronics and Sustainable Communication Systems (ICESC).</italic>
</source>
                    <publisher-name>IEEE</publisher-name>;<year>Jul. 2020</year>; pp.<fpage>534</fpage>&#x2013;<lpage>540</lpage>.
                    <pub-id pub-id-type="doi">10.1109/ICESC48915.2020.9155783</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref36">
                <label>35</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Rahmatinejad</surname>
                            <given-names>Z</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>A comparative study of explainable ensemble learning and logistic regression for predicting in-hospital mortality in the emergency department.</article-title>
                    <source>

                        <italic toggle="yes">Sci. Rep.</italic>
</source>
                    <year>Feb. 2024</year>;<volume>14</volume>(<issue>1</issue>):<fpage>3406</fpage>.
                    <pub-id pub-id-type="pmid">38337000</pub-id>
                    <pub-id pub-id-type="doi">10.1038/s41598-024-54038-4</pub-id>
                    <pub-id pub-id-type="pmcid">PMC10858239</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref37">
                <label>36</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Rajendra</surname>
                            <given-names>P</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Latifi</surname>
                            <given-names>S</given-names>
                        </name>
</person-group>:
                    <article-title>Prediction of diabetes using logistic regression and ensemble techniques.</article-title>
                    <source>

                        <italic toggle="yes">Computer Methods and Programs in Biomedicine Update.</italic>
</source>
                    <year>2021</year>;<volume>1</volume>:<fpage>100032</fpage>.
                    <pub-id pub-id-type="doi">10.1016/j.cmpbup.2021.100032</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref38">
                <label>37</label>
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Madyatmadja</surname>
                            <given-names>ED</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Rianto</surname>
                            <given-names>A</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Andry</surname>
                            <given-names>JF</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <chapter-title>Analysis of Big Data in Healthcare Using Decision Tree Algorithm.</chapter-title>
                    <source>

                        <italic toggle="yes">2021 1st International Conference on Computer Science and Artificial Intelligence (ICCSAI).</italic>
</source>
                    <publisher-name>IEEE</publisher-name>;<year>Oct. 2021</year>; pp.<fpage>313</fpage>&#x2013;<lpage>317</lpage>.
                    <pub-id pub-id-type="doi">10.1109/ICCSAI53272.2021.9609734</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref39">
                <label>38</label>
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Mung</surname>
                            <given-names>PS</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Phyu</surname>
                            <given-names>S</given-names>
                        </name>
</person-group>:
                    <chapter-title>Effective Analytics on Healthcare Big Data Using Ensemble Learning.</chapter-title>
                    <source>

                        <italic toggle="yes">2020 IEEE Conference on Computer Applications (ICCA).</italic>
</source>
                    <publisher-name>IEEE</publisher-name>;<year>Feb. 2020</year>; pp.<fpage>1</fpage>&#x2013;<lpage>4</lpage>.
                    <pub-id pub-id-type="doi">10.1109/ICCA49400.2020.9022853</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref40">
                <label>39</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Jayasri</surname>
                            <given-names>NP</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Aruna</surname>
                            <given-names>R</given-names>
                        </name>
</person-group>:
                    <article-title>Big data analytics in health care by data mining and classification techniques.</article-title>
                    <source>

                        <italic toggle="yes">ICT Express.</italic>
</source>
                    <year>Jun. 2022</year>;<volume>8</volume>(<issue>2</issue>):<fpage>250</fpage>&#x2013;<lpage>257</lpage>.
                    <pub-id pub-id-type="doi">10.1016/j.icte.2021.07.001</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref41">
                <label>40</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Alnowaiser</surname>
                            <given-names>K</given-names>
                        </name>
</person-group>:
                    <article-title>Improving Healthcare Prediction of Diabetic Patients Using KNN Imputed Features and Tri-Ensemble Model.</article-title>
                    <source>

                        <italic toggle="yes">IEEE Access.</italic>
</source>
                    <year>2024</year>;<volume>12</volume>:<fpage>16783</fpage>&#x2013;<lpage>16793</lpage>.
                    <pub-id pub-id-type="doi">10.1109/ACCESS.2024.3359760</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref42">
                <label>41</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Zhang</surname>
                            <given-names>H</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Niu</surname>
                            <given-names>H</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Ma</surname>
                            <given-names>Z</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Wind Turbine Condition Monitoring Based on Bagging Ensemble Strategy and KNN Algorithm.</article-title>
                    <source>

                        <italic toggle="yes">IEEE Access.</italic>
</source>
                    <year>2022</year>;<volume>10</volume>:<fpage>93412</fpage>&#x2013;<lpage>93420</lpage>.
                    <pub-id pub-id-type="doi">10.1109/ACCESS.2022.3164717</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref43">
                <label>42</label>
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Shanthakumari</surname>
                            <given-names>R</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Nalini</surname>
                            <given-names>C</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Vinothkumar</surname>
                            <given-names>S</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <chapter-title>Multi Disease Prediction System using Random Forest Algorithm in Healthcare System.</chapter-title>
                    <source>

                        <italic toggle="yes">2022 International Mobile and Embedded Technology Conference (MECON).</italic>
</source>
                    <publisher-name>IEEE</publisher-name>;<year>Mar. 2022</year>; pp.<fpage>242</fpage>&#x2013;<lpage>247</lpage>.
                    <pub-id pub-id-type="doi">10.1109/MECON53876.2022.9752432</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref44">
                <label>43</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Nafouanti</surname>
                            <given-names>MB</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Li</surname>
                            <given-names>J</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Mustapha</surname>
                            <given-names>NA</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Prediction on the fluoride contamination in groundwater at the Datong Basin, Northern China: Comparison of random forest, logistic regression and artificial neural network.</article-title>
                    <source>

                        <italic toggle="yes">Appl. Geochem.</italic>
</source>
                    <year>Sep. 2021</year>;<volume>132</volume>:<fpage>105054</fpage>.
                    <pub-id pub-id-type="doi">10.1016/j.apgeochem.2021.105054</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref45">
                <label>44</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Butt</surname>
                            <given-names>UM</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Letchmunan</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Ali</surname>
                            <given-names>M</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Machine Learning Based Diabetes Classification and Prediction for Healthcare Applications.</article-title>
                    <source>

                        <italic toggle="yes">J. Healthc. Eng.</italic>
</source>
                    <year>Sep. 2021</year>;<volume>2021</volume>:<fpage>1</fpage>&#x2013;<lpage>17</lpage>.
                    <pub-id pub-id-type="pmid">34631003</pub-id>
                    <pub-id pub-id-type="doi">10.1155/2021/9930985</pub-id>
                    <pub-id pub-id-type="pmcid">PMC8500744</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref46">
                <label>45</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Chen</surname>
                            <given-names>J-C</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Wang</surname>
                            <given-names>Y-M</given-names>
                        </name>
</person-group>:
                    <article-title>Comparing Activation Functions in Modeling Shoreline Variation Using Multilayer Perceptron Neural Network.</article-title>
                    <source>

                        <italic toggle="yes">Water (Basel).</italic>
</source>
                    <year>Apr. 2020</year>;<volume>12</volume>(<issue>5</issue>):<fpage>1281</fpage>.
                    <pub-id pub-id-type="doi">10.3390/w12051281</pub-id>
                </mixed-citation>
            </ref>
        </ref-list>
    </back>
    <sub-article article-type="reviewer-report" id="report458348">
        <front-stub>
            <article-id pub-id-type="doi">10.5256/f1000research.195371.r458348</article-id>
            <title-group>
                <article-title>Reviewer response for version 2</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author">
                    <name>
                        <surname>John</surname>
                        <given-names>Anjum</given-names>
                    </name>
                    <xref ref-type="aff" rid="r458348a1">1</xref>
                    <role>Referee</role>
                    <uri content-type="orcid">https://orcid.org/0000-0002-9873-8550</uri>
                </contrib>
                <aff id="r458348a1">
                    <label>1</label>Pushpagiri Medical College Hospital, Thiruvalla, Kerala, India</aff>
            </contrib-group>
            <author-notes>
                <fn fn-type="conflict">
                    <p>
                        <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>14</day>
                <month>2</month>
                <year>2026</year>
            </pub-date>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2026 John A</copyright-statement>
                <copyright-year>2026</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access peer review report distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <related-article ext-link-type="doi" id="relatedArticleReport458348" related-article-type="peer-reviewed-article" xlink:href="10.12688/f1000research.169436.2"/>
            <custom-meta-group>
                <custom-meta>
                    <meta-name>recommendation</meta-name>
                    <meta-value>approve-with-reservations</meta-value>
                </custom-meta>
            </custom-meta-group>
        </front-stub>
        <body>
            <p>Thank you for allowing me to review this paper which is technically sound and is indexable material. There is novelty and a domain of technical contribution, with acceptable experimental benchmarking but&#x00a0; there are a few concerns about its theoretical depth, clinical translation, and external validation.</p>
            <p> </p>
            <p> 
                <bold>Major Strengths</bold>
            </p>
            <p> &#x00a0;1. Novel Methodological Idea: The core idea &#x2014; gradient-based dynamic weight optimization across heterogeneous base models &#x2014; is &#x00a0;relevant. The model&#x2019;s combination of LR, DT, RF, MLP, KNN uses gradient descent to optimize ensemble weights dynamically and shows measurable performance gain (0.48&#x2013;8.26%) vs standard ensembles. This novelty in applied ML is indexable though theoretical novelty may be insufficient.</p>
            <p> 2. Multi-Dataset Evaluation: The model used five healthcare datasets across domains were used &#x2014; improves perceived generalizability.</p>
            <p> 3. Proper ML Pipeline Elements used included Grid search CV, Train/validation/test splits, Early stopping, and Multiple metrics (AUC, F1, precision, recall)- which meets baseline reproducibility expectations.</p>
            <p> 4. Transparency Elements: Because public datasets used are listed, and the algorithm pseudo code provided, there is an element of transparency.</p>
            <p> </p>
            <p> 
                <bold>Major Concern</bold>
            </p>
            <p>
                <bold> </bold>
            </p>
            <p>
                <bold> 1.&#x00a0;Weak Theoretical Foundation:</bold> Though the model uses gradient descent, evidence of convergence behaviour, Stability conditions, Complexity scaling and Sensitivity to hyperparameters are not explained in detail. This has been flagged by other reviewers in terms of the lack of detailed theoretical rationale for the use of this model. Clarity on the theoretical model is necessary to improve the depth of understanding of the topic as a new one. Suggestions are to add, discussion on convexity, empirical convergence plots, and sensitivity analyses like learning rates, patience, and finalization.</p>
            <p> 2. 
                <bold>Interpretability </bold>&#x2014; As it stands the manuscript shows weight values without clinical meaning being demonstrated. Previous reviews have stated that the study focuses on accuracy but lacks interpretability; add SHAP/LIME. Healthcare ML publication require transparency in contributions, clinician usability, and decision pathway explanations. Please provide at least one of the following: SHAP global + local explanations, feature importance stability across folds, or case-based explanation examples.&#x00a0;</p>
            <p> 3. 
                <bold>External Validation Missing: </bold>For clinical MI credibility after publication, at least one of external dataset testing, Nested CV, or leave-one-dataset-out validation might be performed.</p>
            <p> 4.
                <bold> Possible Overfitting Signals</bold>: The authors show 100% training accuracy in some models with test performance dropping when model complexity increases. The authors can provide learning curves, calibration plots, or bootstrapped CI for AUC.</p>
            <p> 5. Class Imbalance Handling Not Methodologically Strong because the authors rely mostly rely on natural distribution, avoid SMOTE, and argue that performance metrics are stable. Not provided are PR-AUC reporting, Cost-sensitive learning, or Threshold optimization</p>
            <p> 6. 
                <bold>Clinical Relevance Is Mostly Theoretical: </bold>The paper claims that this method Improves patient outcomes, with diagnostic consistency but there was no clinical deployment scenario, and no decision threshold analysis.</p>
            <p> 7. 
                <bold>Dataset Choice Is Safe but Not Challenging:</bold> The datasets used for the stuffy are good for method comparison but weak for real clinical impact assessment.</p>
            <p> 8. Computational Costs important for regular use of the model like training time, memory, and scalability to large HER datasets are not assessed.</p>
            <p> 9. The inconsistencies in grammar, repetition of texts, density of figures, and claims of larger uses than that shown by the data, are minor flaws in the manuscript.</p>
            <p> </p>
            <p> 
                <bold>Recommendations</bold>: The manuscript presents a technically sound and novel ensemble optimization approach with consistent improvements across benchmark healthcare datasets. However, before strong endorsement, the work would benefit from enhanced theoretical grounding of the optimization procedure, additional validation on external datasets, and improved interpretability analyses to support real-world clinical applicability.</p>
            <p>Is the work clearly and accurately presented and does it cite the current literature?</p>
            <p>Yes</p>
            <p>If applicable, is the statistical analysis and its interpretation appropriate?</p>
            <p>Yes</p>
            <p>Are all the source data underlying the results available to ensure full reproducibility?</p>
            <p>Yes</p>
            <p>Is the study design appropriate and is the work technically sound?</p>
            <p>Partly</p>
            <p>Are the conclusions drawn adequately supported by the results?</p>
            <p>Yes</p>
            <p>Are sufficient details of methods and analysis provided to allow replication by others?</p>
            <p>Partly</p>
            <p>Reviewer Expertise:</p>
            <p>Qualitative Research Methods, Medical Students, Teaching, Learning, Public health</p>
            <p>I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard, however I have significant reservations, as outlined above.</p>
        </body>
    </sub-article>
    <sub-article article-type="reviewer-report" id="report442725">
        <front-stub>
            <article-id pub-id-type="doi">10.5256/f1000research.186779.r442725</article-id>
            <title-group>
                <article-title>Reviewer response for version 1</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author">
                    <name>
                        <surname>D</surname>
                        <given-names>Helen</given-names>
                    </name>
                    <xref ref-type="aff" rid="r442725a1">1</xref>
                    <role>Referee</role>
                </contrib>
                <aff id="r442725a1">
                    <label>1</label>SRM Institute of Science and Technology, Kattankulathur, Tamil Nadu, India</aff>
            </contrib-group>
            <author-notes>
                <fn fn-type="conflict">
                    <p>
                        <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>7</day>
                <month>1</month>
                <year>2026</year>
            </pub-date>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2026 D H</copyright-statement>
                <copyright-year>2026</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access peer review report distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <related-article ext-link-type="doi" id="relatedArticleReport442725" related-article-type="peer-reviewed-article" xlink:href="10.12688/f1000research.169436.1"/>
            <custom-meta-group>
                <custom-meta>
                    <meta-name>recommendation</meta-name>
                    <meta-value>approve-with-reservations</meta-value>
                </custom-meta>
            </custom-meta-group>
        </front-stub>
        <body>
            <p>
                <list list-type="order">
                    <list-item>
                        <p>
                            <bold>Novelty and Contribution:</bold>
                        </p>
                        <p> The development of GBWOEM shows the meaningful advancement in ensemble learning method, with a clear focus on weight optimization. The proposed model is compared with standard algorithms and achieves improved accuracy, which highlights its potential contribution.</p>
                    </list-item>
                    <list-item>
                        <p>
                            <bold>Methodology:</bold>
                        </p>
                        <p> The implementation of two different weight initialization methods&#x2014;random (GBWOEM-R) and uniform (GBWOEM-U)&#x2014;and the comparative analysis effectively show the impact of weight initialization on ensemble performance.</p>
                    </list-item>
                    <list-item>
                        <p>
                            <bold>Interpretability:</bold>
                        </p>
                        <p> The paper could benefit from a more detailed explanation of how the optimized weights of base models contribute to the final predictions. This would enhance the interpretability and practical relevance of the model, especially in healthcare applications.</p>
                    </list-item>
                    <list-item>
                        <p>
                            <bold>Class Imbalance:</bold>
                        </p>
                        <p> The datasets used are reported to have class imbalance. The authors should clarify how this imbalance was addressed during training and evaluation to ensure the results are reliable.</p>
                    </list-item>
                    <list-item>
                        <p>
                            <bold>Overfitting Concern:</bold>
                        </p>
                        <p> In Figure 9, ROC curves with AUC values near 1.00 may indicate potential overfitting. The authors should verify these results, possibly by evaluating the models on independent or cross-validation datasets to ensure generalizability.</p>
                    </list-item>
                </list>
            </p>
            <p>Is the work clearly and accurately presented and does it cite the current literature?</p>
            <p>Partly</p>
            <p>If applicable, is the statistical analysis and its interpretation appropriate?</p>
            <p>Partly</p>
            <p>Are all the source data underlying the results available to ensure full reproducibility?</p>
            <p>Partly</p>
            <p>Is the study design appropriate and is the work technically sound?</p>
            <p>Yes</p>
            <p>Are the conclusions drawn adequately supported by the results?</p>
            <p>Partly</p>
            <p>Are sufficient details of methods and analysis provided to allow replication by others?</p>
            <p>Partly</p>
            <p>Reviewer Expertise:</p>
            <p>Machine Learning, Deep Learning</p>
            <p>I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard, however I have significant reservations, as outlined above.</p>
        </body>
        <back>
            <ref-list>
                <title>References</title>
                <ref id="rep-ref-442725-1">
                    <label>1</label>
                    <mixed-citation publication-type="journal">
                        <person-group person-group-type="author"/>:
                        <article-title>Big data-driven optimal weighted fused features-based ensemble learning classifier for thyroid prediction with heuristic algorithm</article-title>.
                        <source>
                            <italic>Journal of Combinatorial Optimization</italic>
                        </source>.<year>2025</year>;<volume>49</volume>(<issue>4</issue>) :
                        <elocation-id>10.1007/s10878-025-01304-4</elocation-id>
                        <pub-id pub-id-type="doi">10.1007/s10878-025-01304-4</pub-id>
                    </mixed-citation>
                </ref>
            </ref-list>
        </back>
        <sub-article article-type="response" id="comment15283-442725">
            <front-stub>
                <contrib-group>
                    <contrib contrib-type="author">
                        <name>
                            <surname>Champati Rai</surname>
                            <given-names>Satyananda </given-names>
                        </name>
                        <aff>School of Computer Engineering, Kalinga Institute of Industrial Technology, Bhubaneswar, Odisha, India</aff>
                    </contrib>
                </contrib-group>
                <author-notes>
                    <fn fn-type="conflict">
                        <p>
                            <bold>Competing interests: </bold>There are no competing interests.</p>
                    </fn>
                </author-notes>
                <pub-date pub-type="epub">
                    <day>16</day>
                    <month>1</month>
                    <year>2026</year>
                </pub-date>
            </front-stub>
            <body>
                <p>
                    <bold>Q1. The paper could benefit from a more detailed explanation of how the optimized weights of base models contribute to the final predictions. This would enhance the interpretability and practical relevance of the model, especially in healthcare applications.</bold>
                </p>
                <p> 
                    <bold>Response:</bold>
                </p>
                <p> We thank the reviewer for this valuable suggestion regarding interpretability. To address this, we have expanded the result to explicitly detail how the optimized weights reflect the contribution of each base model.</p>
                <p> For example, as noted in the revised manuscript, in the GBWOEM-R variant, the Random Forest Classifier (RFC) was assigned a significantly higher weight (1.002) compared to Logistic Regression (0.058), quantitatively demonstrating RFC's stronger contribution to the decision boundary for this specific dataset. Additionally, as requested, we have updated the relevant performance comparison figures to include the final weights of Random Weight (RW) and Uniform Weight (UW) initialization strategies. This visual comparison highlights how our optimization method specifically identifies and prioritizes the most reliable classifiers for healthcare diagnostics, rather than relying on static or arbitrary averaging.</p>
                <p> </p>
                <p> 
                    <bold>Q2. The datasets used are reported to have class imbalance. The authors should clarify how this imbalance was addressed during training and evaluation to ensure the results are reliable.</bold>
                </p>
                <p> 
                    <bold>Response:</bold>
                </p>
                <p> We appreciate the reviewer highlighting this important aspect of data validity. We have analysed the class distribution for all five datasets used in the study. Four of the datasets exhibit a ratio approximating 60:40, which falls within the range of practical balance where standard classifiers perform effectively without intervention.</p>
                <p> For the dataset exhibiting an imbalance, we empirically evaluated the model's performance without synthetic balancing (such as SMOTE). We have clarified in the Methodology section that a part of the dataset is kept as test data set to test the model performance in unseen data. We observed that the model converged successfully with a negligible gap between training and testing performance metrics (specifically, Recall and F1-score). This indicates that the feature space was sufficiently distinct to allow the model to learn the minority class boundaries effectively. We have clarified that we avoided synthetic oversampling for this specific case to prevent the introduction of noise and to ensure the evaluation reflects the model's robustness on naturally occurring data distributions.</p>
                <p> </p>
                <p> 
                    <bold>Q3. In Figure 9, ROC curves with AUC values near 1.00 may indicate potential overfitting. The authors should verify these results, possibly by evaluating the models on independent or cross-validation datasets to ensure generalizability.</bold>
                </p>
                <p> 
                    <bold>Response:</bold>
                </p>
                <p> We agree that AUC values approaching 1.00 warrant careful scrutiny. We have re-verified the results presented in Figure 9. The high AUC values are attributed to the high separability of the datasets, which is consistent with existing literature on the respective datasets.</p>
                <p> Due to strict page length constraints in the submitted manuscript, we could not include the exhaustive Train-vs-Test comparison data for every model variant. However, to address the reviewer&#x2019;s concern, we have provided this detailed analysis below (see Table 1). &#x00a0;As illustrated in Table 1, the performance metrics (especially F1-score, recal,l and precision) for both training and testing phases fall within a consistent range with minimal deviation. The absence of a significant drop in performance from Training to Testing confirms that the model generalizes well to unseen data and is not memorizing the training set. We have added a statement to the Results section clarifying that this stability across splits validates the high AUC scores.</p>
                <p> 
                    <bold>Table 1:</bold> Performance matrices of GBWOEM-R on Breast Cancer Dataset (up to 3 model pairs)</p>
                <p> 
                    <ext-link ext-link-type="uri" xlink:href="https://docs.google.com/spreadsheets/d/1BFQRoqDtJme5ZrmqXKYFwuNuKaGeyq7vQyu6L3k_PYo/edit?usp=sharing">https://docs.google.com/spreadsheets/d/1BFQRoqDtJme5ZrmqXKYFwuNuKaGeyq7vQyu6L3k_PYo/edit?usp=sharing</ext-link>
                </p>
            </body>
        </sub-article>
    </sub-article>
    <sub-article article-type="reviewer-report" id="report427169">
        <front-stub>
            <article-id pub-id-type="doi">10.5256/f1000research.186779.r427169</article-id>
            <title-group>
                <article-title>Reviewer response for version 1</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author">
                    <name>
                        <surname>PRIYA K</surname>
                        <given-names>HEMA</given-names>
                    </name>
                    <xref ref-type="aff" rid="r427169a1">1</xref>
                    <role>Referee</role>
                </contrib>
                <aff id="r427169a1">
                    <label>1</label>Easwari Engineering College, Chennai, Tamil Nadu, India</aff>
            </contrib-group>
            <author-notes>
                <fn fn-type="conflict">
                    <p>
                        <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>20</day>
                <month>11</month>
                <year>2025</year>
            </pub-date>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2025 PRIYA K H</copyright-statement>
                <copyright-year>2025</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access peer review report distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <related-article ext-link-type="doi" id="relatedArticleReport427169" related-article-type="peer-reviewed-article" xlink:href="10.12688/f1000research.169436.1"/>
            <custom-meta-group>
                <custom-meta>
                    <meta-name>recommendation</meta-name>
                    <meta-value>approve</meta-value>
                </custom-meta>
            </custom-meta-group>
        </front-stub>
        <body>
            <p>This manuscript presents a novel ensemble learning framework &#x2014; Gradient-Based Weight&#x00a0;Optimized Ensemble Model (GBWOEM)&#x2014;which introduces a gradient-based weight optimization&#x00a0;strategy for improving predictive accuracy in healthcare classification tasks. Two variants&#x00a0;(GBWOEM-R and GBWOEM-U) are developed and evaluated across five diverse healthcare&#x00a0;datasets.</p>
            <p> </p>
            <p> The model is compared with well-established ensemble methods such as AdaBoost,&#x00a0;CatBoost, GradientBoost, LightGBM, and XGBoost. The study is technically sound and&#x00a0;methodologically comprehensive, offering meaningful improvements in prediction accuracy.</p>
            <p> </p>
            <p> However, certain aspects require deeper theoretical justification, statistical validation, and</p>
            <p> refinement to enhance its scientific robustness, clarity, and clinical relevance.</p>
            <p> </p>
            <p> 
                <bold>Observation 1:</bold>The paper outlines the use of gradient descent for weight optimization but lacks a detailed&#x00a0;theoretical rationale for convergence, stability, or hyperparameter selection.</p>
            <p> 
                <bold>Recommendation 1:</bold>Include a mathematical&#x00a0;discussion or citation to establish convergence guarantees, sensitivity analysis, and computationalcomplexity details.</p>
            <p> </p>
            <p> </p>
            <p> 
                <bold>Observation 2:</bold> The study focuses on accuracy but lacks interpretability, crucial for healthcare AI.</p>
            <p> 
                <bold>Recommendation 2:&#x00a0;</bold>&#x00a0;Add analyses&#x00a0;using SHAP, LIME, or feature importance to show clinical relevance.</p>
            <p> </p>
            <p> The manuscript demonstrates strong potential and novelty but requires theoretical, statistical, and&#x00a0;interpretive enhancements. Addressing these revisions will significantly improve its scholarly rigor&#x00a0;and readiness for indexing.</p>
            <p>Is the work clearly and accurately presented and does it cite the current literature?</p>
            <p>Yes</p>
            <p>If applicable, is the statistical analysis and its interpretation appropriate?</p>
            <p>Partly</p>
            <p>Are all the source data underlying the results available to ensure full reproducibility?</p>
            <p>Yes</p>
            <p>Is the study design appropriate and is the work technically sound?</p>
            <p>Yes</p>
            <p>Are the conclusions drawn adequately supported by the results?</p>
            <p>Yes</p>
            <p>Are sufficient details of methods and analysis provided to allow replication by others?</p>
            <p>Yes</p>
            <p>Reviewer Expertise:</p>
            <p>Thyroid Disorders, Deep Learning, Machine Learning, RNN, DNN, CNN, AI</p>
            <p>I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard.</p>
        </body>
        <back>
            <ref-list>
                <title>References</title>
                <ref id="rep-ref-427169-1">
                    <label>1</label>
                    <mixed-citation publication-type="journal">
                        <person-group person-group-type="author"/>:
                        <article-title>Intelligent Fusion of Heuristically Optimized 1DCNN with Weighted Optimized DNN for Thyroid Disorder Prediction Framework</article-title>.
                        <source>
                            <italic>International Journal of Information Technology &amp; Decision Making</italic>
                        </source>.<year>2025</year>;<volume>24</volume>(<issue>05</issue>) :
                        <elocation-id>10.1142/S0219622025500105</elocation-id>
                        <fpage>1397</fpage>-<lpage>1433</lpage>
                        <pub-id pub-id-type="doi">10.1142/S0219622025500105</pub-id>
                    </mixed-citation>
                </ref>
                <ref id="rep-ref-427169-2">
                    <label>2</label>
                    <mixed-citation publication-type="journal">
                        <person-group person-group-type="author"/>:
                        <article-title>Big data-driven optimal weighted fused features-based ensemble learning classifier for thyroid prediction with heuristic algorithm</article-title>.
                        <source>
                            <italic>Journal of Combinatorial Optimization</italic>
                        </source>.<year>2025</year>;<volume>49</volume>(<issue>4</issue>) :
                        <elocation-id>10.1007/s10878-025-01304-4</elocation-id>
                        <pub-id pub-id-type="doi">10.1007/s10878-025-01304-4</pub-id>
                    </mixed-citation>
                </ref>
                <ref id="rep-ref-427169-3">
                    <label>3</label>
                    <mixed-citation publication-type="journal">
                        <person-group person-group-type="author"/>:
                        <article-title>Innovative Framework for Thyroid Disease Detection by Leveraging Hybrid AGTEO Feature Selection and GRU Classification Model</article-title>.
                        <source>
                            <italic>International Research Journal of Multidisciplinary Technovation</italic>
                        </source>.<year>2024</year>;
                        <elocation-id>10.54392/irjmt2439</elocation-id>
                        <fpage>112</fpage>-<lpage>127</lpage>
                        <pub-id pub-id-type="doi">10.54392/irjmt2439</pub-id>
                    </mixed-citation>
                </ref>
            </ref-list>
        </back>
    </sub-article>
</article>
