<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.2 20190208//EN" "http://jats.nlm.nih.gov/publishing/1.2/JATS-journalpublishing1.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="1.2" xml:lang="en">
    <front>
        <journal-meta>
            <journal-id journal-id-type="pmc">F1000Research</journal-id>
            <journal-title-group>
                <journal-title>F1000Research</journal-title>
            </journal-title-group>
            <issn pub-type="epub">2046-1402</issn>
            <publisher>
                <publisher-name>F1000 Research Limited</publisher-name>
                <publisher-loc>London, UK</publisher-loc>
            </publisher>
        </journal-meta>
        <article-meta>
            <article-id pub-id-type="doi">10.12688/f1000research.161643.2</article-id>
            <article-categories>
                <subj-group subj-group-type="heading">
                    <subject>Research Article</subject>
                </subj-group>
                <subj-group>
                    <subject>Articles</subject>
                </subj-group>
            </article-categories>
            <title-group>
                <article-title>Internet of things attack detection using machine learning algorithms</article-title>
                <fn-group content-type="pub-status">
                    <fn>
                        <p>[version 2; peer review: 2 approved with reservations]</p>
                    </fn>
                </fn-group>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author" corresp="yes">
                    <name>
                        <surname>Abebe</surname>
                        <given-names>Anduamlak</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Conceptualization</role>
                    <role content-type="http://credit.niso.org/">Data Curation</role>
                    <role content-type="http://credit.niso.org/">Formal Analysis</role>
                    <role content-type="http://credit.niso.org/">Investigation</role>
                    <role content-type="http://credit.niso.org/">Methodology</role>
                    <role content-type="http://credit.niso.org/">Resources</role>
                    <role content-type="http://credit.niso.org/">Software</role>
                    <role content-type="http://credit.niso.org/">Supervision</role>
                    <role content-type="http://credit.niso.org/">Validation</role>
                    <role content-type="http://credit.niso.org/">Visualization</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Original Draft Preparation</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <uri content-type="orcid">https://orcid.org/0009-0001-1853-6984</uri>
                    <xref ref-type="corresp" rid="c1">a</xref>
                    <xref ref-type="aff" rid="a1">1</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Gebeyehu</surname>
                        <given-names>Seffi</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Formal Analysis</role>
                    <role content-type="http://credit.niso.org/">Methodology</role>
                    <role content-type="http://credit.niso.org/">Resources</role>
                    <role content-type="http://credit.niso.org/">Software</role>
                    <role content-type="http://credit.niso.org/">Validation</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <xref ref-type="aff" rid="a2">2</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Alem</surname>
                        <given-names>Abebaw</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Conceptualization</role>
                    <role content-type="http://credit.niso.org/">Investigation</role>
                    <role content-type="http://credit.niso.org/">Methodology</role>
                    <role content-type="http://credit.niso.org/">Resources</role>
                    <role content-type="http://credit.niso.org/">Supervision</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <xref ref-type="aff" rid="a3">3</xref>
                </contrib>
                <aff id="a1">
                    <label>1</label>Computer Science, Debre Tabor University, Debre Tabor, Amhara, Ethiopia</aff>
                <aff id="a2">
                    <label>2</label>Computer Science, Bahir Dar University, Bahir Dar, Amhara, Ethiopia</aff>
                <aff id="a3">
                    <label>3</label>Information Technology, Debre Tabor University, Debre Tabor, Amhara, Ethiopia</aff>
            </contrib-group>
            <author-notes>
                <corresp id="c1">
                    <label>a</label>
                    <email xlink:href="mailto:anduamlak09@gmail.com">anduamlak09@gmail.com</email>
                </corresp>
                <fn fn-type="conflict">
                    <p>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>26</day>
                <month>2</month>
                <year>2026</year>
            </pub-date>
            <pub-date pub-type="collection">
                <year>2025</year>
            </pub-date>
            <volume>14</volume>
            <elocation-id>230</elocation-id>
            <history>
                <date date-type="accepted">
                    <day>24</day>
                    <month>2</month>
                    <year>2026</year>
                </date>
            </history>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2026 Abebe A et al.</copyright-statement>
                <copyright-year>2026</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access article distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <self-uri content-type="pdf" xlink:href="https://f1000research.com/articles/14-230/pdf"/>
            <abstract>
                <sec>
                    <title>Background</title>
                    <p>The rapid growth of the Internet of Things (IoT) has brought transformative benefits across industries, yet it also presents significant security challenges due to the proliferation of connected devices.</p>
                </sec>
                <sec>
                    <title>Methods</title>
                    <p>This study proposes an artificial intelligence (AI) model leveraging machine learning algorithms to detect and classify multiple types of IoT attacks, including distributed denial of service (DDoS), reconnaissance, brute force, spoofing, and Mirai attacks, using the CICIoT2023 dataset. The dataset was divided into training and testing sets to ensure accurate performance assessment. After training, the models were tested, and their effectiveness was evaluated through metrics like accuracy and confusion matrices.</p>
                </sec>
                <sec>
                    <title>Results and conclusions</title>
                    <p>Among the algorithms used, the decision tree model outperformed than others, achieving an impressive accuracy of 98.34%. In contrast, Bayes classifiers, support vector machines (SVM), and logistic regression achieved accuracy rates of 92%, 91.5%, and 75%, respectively. These results highlight the significant potential of machine learning techniques in detecting and mitigating various IoT attacks, offering promising avenues for enhancing IoT security. The improvement of the performance of the IoT attack detection model using large datasets and the appropriate using deep learning algorithms with their parameters will be our future consideration in the domain.</p>
                </sec>
            </abstract>
            <kwd-group kwd-group-type="author">
                <kwd>Internet of Things</kwd>
                <kwd>cyber-attacks</kwd>
                <kwd>Internet of Things security</kwd>
                <kwd>machine learning</kwd>
            </kwd-group>
            <funding-group>
                <funding-statement>The author(s) declared that no grants were involved in supporting this work.</funding-statement>
            </funding-group>
        </article-meta>
        <notes>
            <sec sec-type="version-changes">
                <label>Revised</label>
                <title>Amendments from Version 1</title>
                <p>We revised our manuscript by expanding the literature review section and conclusion section adjustment.</p>
            </sec>
        </notes>
    </front>
    <body>
        <sec id="sec4" sec-type="intro">
            <title>1. Introduction</title>
            <p>The Internet of Things (IoT) is a network of hundreds of millions of gadgets that can communicate with one another with little help from users. IoT attack is a type of cyber-attack that targets systems made up of physical things, cars, buildings, and other objects integrated with software that allows them to exchange or collect data.
                <sup>
                    <xref ref-type="bibr" rid="ref1">1</xref>
                </sup> As described by Anwer A. &amp; et al.,
                <sup>
                    <xref ref-type="bibr" rid="ref2">2</xref>
                </sup> there were about 28 billion IoT devices in use in 2018. By 2022, this sum is predicted to reach 49.1 billion, and the IoT is projected to reach a display size of approximately ten trillion. IoT is acknowledged as a technique for appropriate mechanisms connected via servers, sensors, and different software.
                <sup>
                    <xref ref-type="bibr" rid="ref2">2</xref>
                </sup>
            </p>
            <p>According to the Ethiopian Information Network Security Administration (INSA) director report, they saved 23.2 billion birrs by defending against cyber-attacks. During 2022/2023, more than 6,859 cyber-attacks occurred and only 6,768 cyber-attacks got solutions. Banking and financial institutions, national intelligence security services, media institutions, selected governmental institutions, regional offices, health and higher institutions are the most targeted centers. According to the report, website attacks, malware attacks, port scans, distributed denial of service (DDoS), and structured query language (SQL) Injection are the most frequently occurring types of attacks in Ethiopia during 2022/23.
                <sup>
                    <xref ref-type="bibr" rid="ref3">3</xref>
                </sup>
            </p>
            <p>It is difficult to produce IoT security data that is useful for actual applications for several reasons. Having a vast network made up of multiple actual IoT devices, akin to the topologies of actual IoT applications, is one of the primary issues. Due to the widespread adoption of IoT, its inherent mobility, and standardization limitations, numerous researchers have looked into the risks that IoT devices pose to large corporations and smart towns. As a result, smart mechanisms that can automatically detect suspicious movement on IoT devices connected to local networks are required.
                <sup>
                    <xref ref-type="bibr" rid="ref2">2</xref>,
                    <xref ref-type="bibr" rid="ref4">4</xref>
                </sup> The pervasive growth of the IoT creates an expanding attack surface for malicious actors. Detecting these attacks effectively is crucial for securing IoT systems and protecting sensitive data. This paper explored the use of machine learning (ML) for attack detection in IoT environments, focusing on the challenge of imbalanced datasets and potential solutions.</p>
            <p>The IoT has become a crucial component of today&#x2019;s technological landscape, as it allows various devices and systems to connect and communicate with each other over the Internet. This interconnected network of devices has revolutionized many industries, including healthcare, transportation, manufacturing, and smart homes. The IoT has become increasingly significant in today&#x2019;s world by 
                <bold>c</bold>onnecting everyday objects to the Internet, automating tasks and processes, enhancing data-driven decision-making, and creating new opportunities.</p>
            <p>However, the widespread adoption of IoT devices has also introduced new security challenges and vulnerabilities. IoT devices are often designed with limited processing power and memory, making them more susceptible to attacks. Additionally, many IoT devices lack robust security features, such as encryption and secure authentication mechanisms, interconnectedness, and privacy concerns, making them easy targets for cybercriminals. There are different types of attacks targeting IoT devices namely; malware, DoS attacks, man-in-the-middle attacks, botnet attacks, and physical attacks. IoT devices, with their limited processing power, are vulnerable to cyberattacks, making them attractive targets for hackers seeking unauthorized access or control. These devices collect vast amounts of personal data, and inadequate security can lead to serious privacy breaches. Many are integrated into critical infrastructure, meaning attacks can cause widespread disruption and economic damage. Compliance with regulations is essential to avoid legal and reputational consequences. Security flaws in one device can compromise entire networks, emphasizing the need for robust protection. High-profile breaches can erode consumer trust, hinder adoption, and result in significant financial losses. If security risks are not addressed, innovation in IoT may slow down. Ensuring long-term sustainability requires continuous investment in security measures, and collaboration among organizations, developers, and policymakers is crucial for a secure IoT ecosystem.</p>
            <p>The main contributions of this work are summarized as:
                <list list-type="order">
                    <list-item>
                        <label>(1)</label>
                        <p>Prominent result: The proposed model is focusing on evaluating ML algorithms&#x2019; performance using unbalanced datasets and the prominent result was resulted. Moreover, the authors also compared the results from the existed related works and performance has been improved.</p>
                    </list-item>
                    <list-item>
                        <label>(2)</label>
                        <p>Automation and efficiency: ML algorithms can analyze large amounts of IoT network data more quickly and accurately than manual methods. This could enable the detection of attacks in real time, enhancing the security of IoT systems.</p>
                    </list-item>
                    <list-item>
                        <label>(3)</label>
                        <p>Scalability: As the number of IoT devices continues to grow rapidly, ML based systems can scale efficiently to handle large networks with numerous devices, ensuring comprehensive attack identification and protection.</p>
                    </list-item>
                </list>
            </p>
        </sec>
        <sec id="sec5">
            <title>2. Related works</title>
            <p>Several scholars used various methodologies to carry out studies on cyber-attack detection.</p>
            <p>In their study,
                <sup>
                    <xref ref-type="bibr" rid="ref2">2</xref>
                </sup> outlined a methodology for identifying suspicious network activity. They achieved a performance result of 85.34% using a random forest (RF) algorithm. Using the NSL KDD dataset, the suggested framework was used, and the results were compared for training, prediction time, specificity, and accuracy.</p>
            <p>In their study,
                <sup>
                    <xref ref-type="bibr" rid="ref5">5</xref>
                </sup> several detection techniques are assessed using the recently created Bot-IoT dataset. During the implementation stage, seven distinct ML algorithms were employed, with the majority demonstrating exceptional performance. Throughout the deployment, new features were taken from the Bot-IoT dataset.</p>
            <p>In their study,
                <sup>
                    <xref ref-type="bibr" rid="ref6">6</xref>
                </sup> they used six distinct algorithms RF, Logistic Regression (LR), SVM, NB, K-Nearest Neighbors (KNN), and multilayer perceptron (MLP) to conduct a comparative analysis of IoT cyber-attack detection techniques.</p>
            <p>In their study,
                <sup>
                    <xref ref-type="bibr" rid="ref7">7</xref>
                </sup> To effectively detect attacks and abnormalities in IoT systems, the authors of the paper compared the performances of numerous ML models. LR, SVM, decision tree (DT), RF, and artificial neural network (ANN) are the ML algorithms that were employed in this case.</p>
            <p>In their study,
                <sup>
                    <xref ref-type="bibr" rid="ref8">8</xref>
                </sup> they performed IoT behavior classification, monitoring the expected IoT behaviors and evaluating the efficacy of our optimally selected classifiers versus the superset of specialized classifiers by applying them to our IoT traffic traces.</p>
            <p>In their study,
                <sup>
                    <xref ref-type="bibr" rid="ref9">9</xref>
                </sup> the study attempts to secure IoT devices by employing a Raspberry Pi as a honeypot to mimic IoT devices and verify the user&#x2019;s intent, examine various attack patterns, and shield IoT devices from known threats. The purpose of these honeypots is to protect various protocols in IoT devices that are susceptible to assaults.</p>
            <p>In their study,
                <sup>
                    <xref ref-type="bibr" rid="ref10">10</xref>
                </sup> Using an extended topology made up of multiple real IoT devices, they conducted a novel realistic IoT attack dataset, adopting IoT devices as both attackers and victims. They carried out, recorded, and gathered information from 33 attacks against IoT devices, categorized into seven types, and they showed how they could be replicated. Using the CICIoT2023 dataset, they assessed how well ML and deep learning algorithms classified and detected benign or malicious IoT network traffic.</p>
            <p>In their study,
                <sup>
                    <xref ref-type="bibr" rid="ref11">11</xref>
                </sup> applied a hybrid deep learning technique to handle the problem of uneven data classification in attack detection. Convolutional neural networks (CNNs) and long short-term memory (LSTM) networks are two components of a hybrid deep learning model that the authors suggest using to enhance classification performance. They draw attention to the difficulties that imbalanced datasets present in precisely identifying attacks. CNNs are useful for extracting spatial properties from the data, they say, whereas LSTM networks are better at extracting temporal dependencies from sequential data. The hybrid deep learning model&#x2019;s performance is compared with that of conventional ML methods by the authors through experimentation on attack datasets that are not balanced. The results demonstrate that the hybrid deep learning approach outperforms traditional methods in detecting attacks in imbalanced datasets, showcasing the effectiveness of combining CNNs and LSTM networks for improved classification accuracy.</p>
            <p>In their study,
                <sup>
                    <xref ref-type="bibr" rid="ref12">12</xref>
                </sup> explains in detail the many ML methods that are employed to identify IoT botnets. In the IoT ecosystem, botnets pose an increasing threat, as the review emphasizes the significance of IoT security. It covers the many ML techniques and algorithms that have been put forth to identify and lessen IoT botnet threats. To give readers an understanding of the current status of this field of research, the manuscript carefully assesses the advantages and disadvantages of different methodologies. For those working on botnet detection and IoT security, the paper is an invaluable resource overall.</p>
            <p>The study,
                <sup>
                    <xref ref-type="bibr" rid="ref13">13</xref>
                </sup> examined how ML approaches applied to Industrial Internet of Things (IIoT) systems security are affected by imbalanced datasets. To better understand how class imbalances in datasets impact ML models&#x2019; ability to identify security vulnerabilities in IIoT environments, the study looks into how these imbalances may impact model performance and accuracy. Within the framework of IIoT security, it addressed several problems and difficulties associated with unbalanced datasets, including minority class misclassification and biased model predictions. Additionally, to improve the efficacy of machine learning-based security mechanisms in IIoT systems, the book suggests possible approaches and answers to these problems. Overall, the study provided valuable insights into the implications of imbalanced datasets on the security of IIoT and offers recommendations for improving the robustness and reliability of security measures in industrial IoT settings.</p>
            <p>According to Radanliev et al.,
                <sup>
                    <xref ref-type="bibr" rid="ref22">14</xref>
                </sup> as data strategies evolve, dependency models have become increasingly valuable for managing contemporary cyber risk challenges. These models aid in cyber risk estimation and general impact assessments by illustrating the intricate relationships among various digital components. The literature underscores the importance of a comprehensive understanding of cyber risks, particularly in relation to the Internet of Things (IoT), where conventional assessment methods may fall short. The paper advocates for the adoption of innovative risk assessment and management strategies that can effectively address the unique challenges presented by emerging IoT cyber threats. By utilizing these methods, the cybersecurity community can enhance its defenses and better navigate the constantly shifting landscape of digital vulnerabilities.</p>
            <p>According to Radanliev et al.,
                <sup>
                    <xref ref-type="bibr" rid="ref23">15</xref>
                </sup> the study focuses on the role of AI-based Bill of Materials (BOMs) in ensuring the trustworthiness and quality of AI systems, evaluating CHERI&#x2019;s security features for addressing cybersecurity threats, and using AI techniques to identify and analyze threats, exploits, and vulnerabilities in Software Bill of Materials (SBOMs). The results indicate that combining CHERI with AI BOMs significantly improves the security and transparency of AI systems. This integration not only aids in identifying and mitigating specific threats and vulnerabilities but also enhances trust and security within AI systems, highlighting the potential of AI-driven approaches to bolster the security of SBOMs.</p>
            <p>However, the security issue of IoT has not addressed yet and further investigations are required. Therefore, we the authors are focusing on such issues to improve the performances of the existing works and evaluating other ML algorithms in this paper.</p>
        </sec>
        <sec id="sec6" sec-type="methods">
            <title>3. Methods</title>
            <p>This study followed crucial steps illustrated in the proposed IoT attack detection architecture to conduct rigorous experiments, as shown in 
                <xref ref-type="fig" rid="f1">
Figure 1</xref> designed by the authors.</p>
            <fig fig-type="figure" id="f1" orientation="portrait" position="float">
                <label>
Figure 1. </label>
                <caption>
                    <title>Proposed model architectures of IoT attack detection.</title>
                    <p>This figure has been created by the author.</p>
                </caption>
                <graphic id="gr1" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/197072/2a353af9-ba8a-41f4-a370-efaca0579050_figure1.gif"/>
            </fig>
            <sec id="sec7">
                <title>3.1 Dataset information</title>
                <p>One of the most frequent problems faced by ML researchers is locating reliable datasets with the necessary properties. Regardless of the size of the dataset, selecting a specific learning technique is not as crucial as creating a well-cleaned representative dataset.
                    <sup>
                        <xref ref-type="bibr" rid="ref14">16</xref>
                    </sup> In our investigation, we used a distinct IoT attack dataset from the CICIoT2023, which has a total of 221,834 occurrences that were recorded as Comma Separated Values (CSV) files. In our study, 42 relevant features were extracted, and the total dataset was labeled namely Benign Traffic, DDoS, Spoofing, SQL Injection, Recon, and Mirai. The following three key reasons were taken into account why selecting the aforementioned dataset: i) the dataset contains 42 attributes extracted from different categories of IoT attack features; ii) the dataset contains 221,834 dataset instances which are cleaned, imbalanced, and contain the required features as shown in 
                    <xref ref-type="table" rid="T1">
Table 1</xref>; iii) the dataset contains raw datasets so that it is possible to generate new features as needed.</p>
                <table-wrap id="T1" orientation="portrait" position="float">
                    <label>
Table 1. </label>
                    <caption>
                        <title>Dataset information.</title>
                    </caption>
                    <table content-type="article-table" frame="hsides">
                        <thead>
                            <tr>
                                <th align="left" colspan="1" rowspan="1" valign="top">IoT attack classes</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">Collected dataset</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">Dataset source</th>
                            </tr>
                        </thead>
                        <tbody>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Mirai</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">50,632</td>
                                <td align="left" colspan="1" rowspan="7" valign="top">Canadian Institute for Cyber Security CICIoT2023</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Recon</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">6,094</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">SQL Injection</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">185</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Benign Traffic</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">21102</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">DDoS</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">137,941</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Spoofing</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">5880</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Total dataset</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">221,834</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
            </sec>
            <sec id="sec8">
                <title>3.2 Data Preprocessing and feature selection</title>
                <p>Preprocessing data and feature extraction for IoT attack detection with an imbalanced dataset is an important step to ensure the effectiveness of ML approaches. The researcher implemented dimensionality reduction, data splitting, and data cleaning. To ensure its quality and reliability, the researcher handles missing values, outliers, and any inconsistencies in the dataset.</p>
                <p>Feature selection involves selecting and transforming relevant features from the raw data to improve the performance of the ML model. The researcher extracted 42 informative features using principal component analysis techniques.</p>
            </sec>
            <sec id="sec9">
                <title>3.3 Train-test dataset spit ratios</title>
                <p>Train-test dataset splits are required before feeding datasets to the learning algorithms. This is because it&#x2019;s anticipated that learning model(s) would be evaluated using unidentified datasets to assess how well they can forecast new IoT threats. Most studies employed train-test dataset split ratios of 80%:20%.
                    <sup>
                        <xref ref-type="bibr" rid="ref15">17</xref>
                    </sup> However, the study groups could not agree on how much train-test dataset split ratio to use for how many dataset instances. This is why the suggested study chose a dataset split ratio that yields improved training and testing set accuracy for each classifier by using 80%:20% train-test dataset split ratios on each classifier.</p>
                <p>As a result, for our model experiment from the total dataset, we have taken 80% (177,467) of the dataset used for training, and 20% (44,367) used for testing our model performance accuracy.</p>
            </sec>
            <sec id="sec10">
                <title>3.4 Implementation Tools and Algorithms</title>
                <p>The study conducted extensive experiments using Python to test and train the suggested Supervised ML algorithms using high-speed computing. Python was chosen as the implementation language for the study due to its abundance of libraries and packages tailored for ML research.</p>
                <p>We the authors employed four well-known ML algorithms, namely; decision tree, SVM with default parameters, SVM with sigmoid kernel, LR, and Na&#x00ef;ve Bayes
                    <sup>
                        <xref ref-type="bibr" rid="ref16">18</xref>&#x2013;
                        <xref ref-type="bibr" rid="ref19">21</xref>
                    </sup> to identify IoT attacks.</p>
                <p>DTs are versatile and intuitive models that make predictions by recursively splitting the data based on different features. They are known for being interpretable and can handle both categorical and numerical data. We used default DT parameters like Max depth, minimum samples per leaf, splitting criteria, and maximum features per split.</p>
                <p>SVM is a powerful algorithm that separates data points into different classes by finding the best hyperplane that maximizes the margin between the classes. The default parameters refer to the default values set by the algorithm, which may vary depending on the implementation. SVM can also utilize different kernels, such as the sigmoid kernel, which allows for non-linear separation of data points. The sigmoid kernel maps the data into a higher-dimensional space to find a decision boundary.</p>
                <p>Despite its name, LR is a classification algorithm rather than a regression algorithm. It calculates the probability of an instance belonging to a certain class using a logistic function. It&#x2019;s commonly used for binary classification problems. To control the degree of regularization, penalizing complex models, and reducing overfitting we used the regularization parameter (lambda). Chooses gradient descent algorithm used to find the optimal model parameters. Sets the maximum number of iterations for the solver to find the optimal parameters.</p>
                <p>Na&#x00ef;ve Bayes is a probabilistic classifier that calculates the probability of an instance belonging to a particular class based on Bayes&#x2019; theorem, assuming that all features are independent. We used the following key parameters to implement the Na&#x00ef;ve Bayes algorithm for IoT attack detections. Smoothing parameter (Alpha): Adds a small value to the estimated probabilities to avoid division by zero and improve stability, especially with sparse data. Feature selection: Choosing the subset of features most relevant for classification can improve performance and interpretability.</p>
            </sec>
        </sec>
        <sec id="sec11">
            <title>4. Experimental result evaluation</title>
            <sec id="sec12">
                <title>4.1 Evaluation metrics</title>
                <p>It&#x2019;s critical to specify performance metrics appropriate for the task at hand when assessing ML models. We employed the most significant performance metrics for, the accuracy, and confusion matrix to assess our findings.
                    <sup>
                        <xref ref-type="bibr" rid="ref20">22</xref>
                    </sup>
                </p>
                <p>Accuracy is calculated as the sum of two accurate predictions (TP + TN) divided by the total number of data sets (P + N). The best accuracy is 1.0, and the worst is 0.00.
                    <sup>
                        <xref ref-type="bibr" rid="ref20">22</xref>
                    </sup>
                    <disp-formula id="e1">

                        <mml:math display="block">
                            <mml:mtext>Accuracy</mml:mtext>
                            <mml:mo>=</mml:mo>
                            <mml:mfrac>
                                <mml:mrow>
                                    <mml:mi mathvariant="normal">TP</mml:mi>
                                    <mml:mo>+</mml:mo>
                                    <mml:mi mathvariant="normal">TN</mml:mi>
                                </mml:mrow>
                                <mml:mrow>
                                    <mml:mi mathvariant="normal">P</mml:mi>
                                    <mml:mo>+</mml:mo>
                                    <mml:mi mathvariant="normal">N</mml:mi>
                                </mml:mrow>
                            </mml:mfrac>
                        </mml:math>

                        <label>(1)</label>
</disp-formula>
                </p>
            </sec>
            <sec id="sec13">
                <title>4.2 Experimental results and comparisons</title>
                <p>To attain better performance results, we conducted data preprocessing techniques. The dataset is transformed into a structure appropriate for ML using pre-processing data transformation techniques.
                    <sup>
                        <xref ref-type="bibr" rid="ref21">23</xref>
                    </sup> To make the dataset more accurate and efficient, this stage also involves cleaning it by deleting any irrelevant or corrupted data.</p>
                <p>We employed various supervised ML techniques, including LR, DT, SVM, and NB, to carry out this investigation. DT outperformed other ML algorithms by achieving accuracy of 98.34%, as shown in 
                    <xref ref-type="table" rid="T2">
Table 2</xref>.</p>
                <table-wrap id="T2" orientation="portrait" position="float">
                    <label>
Table 2. </label>
                    <caption>
                        <title>Applied ML algorithm performance result.</title>
                    </caption>
                    <table content-type="article-table" frame="hsides">
                        <thead>
                            <tr>
                                <th align="left" colspan="1" rowspan="1" valign="top">Machine learning algorithms</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">Accuracy %</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">
Remark</th>
                            </tr>
                        </thead>
                        <tbody>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Decision tree (DT)</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">98.34%</td>
                                <td colspan="1" rowspan="1"/>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="2" valign="top">Support Vector Machine (SVM)</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">91.5%</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">With default hyperparameters</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">69.27%</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">With sigmoid kernel</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Logistic Regression (LR)</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">75%</td>
                                <td colspan="1" rowspan="1"/>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Na&#x00ef;ve Bayes (NB)</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">92%</td>
                                <td colspan="1" rowspan="1"/>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
                <p>Accuracy is one of the most relevant performance evaluation metrics in ML as well as deep learning algorithms. This metric is also deployed in this work, as shown in 
                    <xref ref-type="table" rid="T2">
Table 2</xref> that shows DT was the highest-performing algorithm, followed by NB and SVM with default value. SVM with a sigmoid kernel received the lowest performance score of 69.27%, making it the least effective algorithm. Despite having a high-performance score, NB was notably slower than the other algorithms. Graphically, the performance result is shown in 
                    <xref ref-type="fig" rid="f2">
Figure 2</xref>.</p>
                <fig fig-type="figure" id="f2" orientation="portrait" position="float">
                    <label>
Figure 2. </label>
                    <caption>
                        <title>Machine learning approach performance applied to the CICIoT2023 dataset.</title>
                    </caption>
                    <graphic id="gr2" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/197072/2a353af9-ba8a-41f4-a370-efaca0579050_figure2.gif"/>
                </fig>
                <p>In addition to accuracy, confusion matrix is also used to evaluate the performance. An N x N matrix, where N is the total number of target classes, is called a confusion matrix and is used to assess how well a classification model performs. The ML model&#x2019;s predicted outcomes are compared with the actual target values in the matrix. The confusion matrix was obtained when we employed different ML algorithms of SVM, LR, NB, and DT algorithms respectively, as shown in 
                    <xref ref-type="fig" rid="f3">
Figure 3</xref>.</p>
                <fig fig-type="figure" id="f3" orientation="portrait" position="float">
                    <label>
Figure 3. </label>
                    <caption>
                        <title>Confusion matrix obtained in the identification process conducted using different machine learning models (SVM (A), LR (B), NB (C), and DT (D)).</title>
                    </caption>
                    <graphic id="gr3" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/197072/2a353af9-ba8a-41f4-a370-efaca0579050_figure3.gif"/>
                </fig>
                <p>In addition to comparing and evaluating the performance of the ML algorithms deployed in this work, the authors also compared such algorithms with the existed related works, as shown in 
                    <xref ref-type="table" rid="T3">
Table 3</xref>. In most of cases, the performance improvements have been achieved in the state-of-the-art even though there are different limitations and challenges that need further investigations in the domain area.</p>
                <table-wrap id="T3" orientation="portrait" position="float">
                    <label>
Table 3. </label>
                    <caption>
                        <title>Result comparison from the related works.</title>
                    </caption>
                    <table content-type="article-table" frame="hsides">
                        <thead>
                            <tr>
                                <th align="left" colspan="1" rowspan="1" valign="top">Related works</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">Title of related work</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">Methods used</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">
Performance %</th>
                            </tr>
                        </thead>
                        <tbody>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">
                                    <sup>
                                        <xref ref-type="bibr" rid="ref5">5</xref>
                                    </sup>
                                </td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Internet of Things Cyberattacks Detection Using Machine Learning</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">NB</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">79%</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">
                                    <sup>
                                        <xref ref-type="bibr" rid="ref2">2</xref>
                                    </sup>
                                </td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Attack Detection in IoT Using Machine Learning</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">SVM, RF</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">85.34%</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">
                                    <sup>
                                        <xref ref-type="bibr" rid="ref4">4</xref>
                                    </sup>
                                </td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Cyberattack Detection Using Machine Learning</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">KNN &amp; RF</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">88%</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">
                                    <sup>
                                        <xref ref-type="bibr" rid="ref7">7</xref>
                                    </sup>
                                </td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Attack and anomaly detection in IoT sensors in IoT sites using machine learning approaches</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">DT, RF &amp; ANN</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">99.4%</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">
                                    <sup>
                                        <xref ref-type="bibr" rid="ref10">10</xref>
                                    </sup>
                                </td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Botnet Attack Detection in IoT Using Machine Learning Technique</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">DT, LR</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">94%</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">
                                    <bold>Our proposed work</bold>
</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Artificial intelligence model for internet of things attack detection using machine learning algorithms</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">
                                    <bold>DT, NB, SVM, LR</bold>
</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">
                                    <bold>98.34%</bold>
</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
            </sec>
        </sec>
        <sec id="sec14" sec-type="conclusions">
            <title>5. Conclusions</title>
            <p>IoT security attacks have been a hot issue in recent time. This paper aimed to design a multi-class IoT attack detection model using ML algorithms. The employed four supervised ML algorithms, namely; DT, SVM, LR, and NB were used to address the proposed problem related to identifying IoT attacks. The recent Canadian Institute of Cyber Security CICIoT2023 dataset, which contains the imbalanced instances and multi-class types of attacks with six classes, was used for designing and evaluating the proposed model. The dataset was splited into 80%:20% ratio for training and testing the model, respectively. The experiments are conducted using Python in Google Co-Lab.</p>
            <p>To evaluate the model performance, we used tabular representation (accuracy) and confusion matrix for each employed algorithm. The prominent performance result has been found. In DT, we attained the maximum prediction accuracy rate of 98.34%. DT outperforms SVM at 91.5%, LR at 75%, and Bayes classifiers (NB) at 92%. Our model performs superior accuracy in the prediction of these IoT attacks when compared to other benchmarks of ML classification approaches.</p>
            <p>In the area of IoT threat detection, our suggested model result offers several contributions, including resolving unbalanced data issues, enhancing detection precision, increasing imbalanced data awareness, improving performance, and forwarding future directions in the area. Therefore, the result could be enhancing security, reducing response time, and enabling adaptive defense to provide a significant contribution to the domain of IoT security. The work on IoT security attack identification using ML approaches holds great promise in improving IoT security.</p>
            <p>The findings from the multi-class IoT attack detection model highlight several urgent actions for the industry, including the need to expand and diversify datasets for reliability, build resilience against adversarial attacks, enhance detection precision through continual algorithm refinement, promote awareness and education on IoT security challenges, and foster collaboration among stakeholders, researchers, and cybersecurity experts to strengthen defense mechanisms.</p>
            <p>The design of IoT security attack detection systems faces several limitations. Firstly, the dataset used may be too small or homogeneous, affecting the reliability and general applicability of the assessments. Secondly, adversarial attacks can manipulate IoT network traffic, potentially evading machine learning detection systems and exploiting vulnerabilities within the models or their input data, making accurate detection challenging. Lastly, the study relied solely on machine learning algorithms rather than incorporating deep learning methods, which are crucial for enhancing performance with larger datasets.</p>
            <p>Based on the limitations mentioned earlier, the improvement of the performance of IoT attack detection model using large datasets and the appropriate deep learning algorithms with their parameters will be our future consideration in the domain.</p>
        </sec>
        <sec id="sec15">
            <title>Ethics and consent</title>
            <p>Ethical approval and consent were not required.</p>
        </sec>
    </body>
    <back>
        <sec id="sec18">
            <title>Data availability</title>
            <p>All necessary data available from Kaggle and download it after filling CIC DATASET DOWNLOAD FORM for &#x201c;CIC_IOT_Dataset2023&#x201d; form. 
                <ext-link ext-link-type="uri" xlink:href="https://www.unb.ca/cic/datasets/iotdataset-2023.html">https://www.unb.ca/cic/datasets/iotdataset-2023.html</ext-link>.</p>
        </sec>
        <ref-list>
            <title>References</title>
            <ref id="ref1">
                <label>1</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Abdul-Qawy</surname>
                            <given-names>AS</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Magesh</surname>
                            <given-names>E</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Tadisetty</surname>
                            <given-names>S</given-names>
                        </name>
</person-group>:
                    <article-title>The Internet of Things (IoT): An Overview.</article-title>
                    <source>

                        <italic toggle="yes">Int. J. Eng. Res. Appl.</italic>
</source>
                    <year>2015</year>.</mixed-citation>
            </ref>
            <ref id="ref2">
                <label>2</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Tharwat</surname>
                            <given-names>A</given-names>
                        </name>
</person-group>:
                    <article-title>Classification assessment methods.</article-title>
                    <source>

                        <italic toggle="yes">Applied Computing and Informatics.</italic>
</source>
                    <year>2020</year>;<volume>17</volume>(<issue>1</issue>):<fpage>168</fpage>&#x2013;<lpage>192</lpage>.
                    <pub-id pub-id-type="doi">10.1016/j.aci.2018.08.003</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref3">
                <label>3</label>
                <mixed-citation publication-type="other">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Belay</surname>
                            <given-names>TE</given-names>
                        </name>
</person-group>:
                    <chapter-title>Web Security Vulnerability Analysis of Ethiopian Government Offices.</chapter-title>
                    <source>

                        <italic toggle="yes">2nd world conference on Engineering and Technology.</italic>
</source>
                    <publisher-loc>Brussels, Belgium</publisher-loc>:<year>2021</year>.</mixed-citation>
            </ref>
            <ref id="ref4">
                <label>4</label>
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Soka</surname>
                            <given-names>S</given-names>
                        </name>
</person-group>:
                    <source>

                        <italic toggle="yes">Cyber attack assessment report in Ethiopia during 2023.</italic>
</source>
                    <publisher-loc>Addis Abeba</publisher-loc>:
                    <publisher-name>INSA-&#x12e8;&#x12a2;&#x1295;&#x134e;&#x122d;&#x121c;&#x123d;&#x1295; &#x1218;&#x1228;&#x1265; &#x12f0;&#x1205;&#x1295;&#x1290;&#x1275; &#x12a0;&#x1235;&#x1270;&#x12f3;&#x12f0;&#x122d;</publisher-name>;<year>2023</year>.</mixed-citation>
            </ref>
            <ref id="ref5">
                <label>5</label>
                <mixed-citation publication-type="other">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Haseeb</surname>
                            <given-names>J</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Mansoori</surname>
                            <given-names>M</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Al-Sahaf</surname>
                            <given-names>H</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <chapter-title>IoT Attacks: Features Identification and Clustering.</chapter-title>
                    <source>

                        <italic toggle="yes">2020 IEEE 19th International Conference on Trust, Security and Privacy in Computing and Communications (TrustCom).</italic>
</source>
                    <publisher-loc>Western Sydney</publisher-loc>:<year>2020</year>.</mixed-citation>
            </ref>
            <ref id="ref6">
                <label>6</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Jadel Alsamiri</surname>
                            <given-names>KA</given-names>
                        </name>
</person-group>:
                    <article-title>Internet of Things Cyber Attacks Detection using Machine Learning.</article-title>
                    <source>

                        <italic toggle="yes">(IJACSA) International Journal of Advanced Computer Science and Applications.</italic>
</source>
                    <year>2019</year>;<volume>10</volume>.
                    <pub-id pub-id-type="doi">10.14569/IJACSA.2019.0101280</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref7">
                <label>7</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Mohammed</surname>
                            <given-names>AHK</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Jebamikyous</surname>
                            <given-names>H-H</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>IoT Cyber-Attack Detection: A Comparative Analysis.</article-title>
                    <source>

                        <italic toggle="yes">ACM.</italic>
</source>
                    <year>2021</year>.
                    <pub-id pub-id-type="doi">10.1145/3460620.3460742</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref8">
                <label>8</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Deepthi Reddy</surname>
                            <given-names>SK</given-names>
                        </name>
</person-group>:
                    <article-title>Cyber Attacks Detection using Machine Learning.</article-title>
                    <source>

                        <italic toggle="yes">Neuroquantology.</italic>
</source>
                    <year>2022</year>.</mixed-citation>
            </ref>
            <ref id="ref9">
                <label>9</label>
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Hasan</surname>
                            <given-names>M</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Islam</surname>
                            <given-names>MM</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Zarif</surname>
                            <given-names>MII</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <source>

                        <italic toggle="yes">Attack and anomaly detection in IoT sensors in IoT sites using machine learning approaches.</italic>
</source>
                    <publisher-name>Elsevier B.V.</publisher-name>;<year>2019</year>.
                    <pub-id pub-id-type="doi">10.1016/j.iot.2019.100059</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref10">
                <label>10</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Pashamokhtari</surname>
                            <given-names>A</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Batista</surname>
                            <given-names>G</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Gharakheili</surname>
                            <given-names>HH</given-names>
                        </name>
</person-group>:
                    <article-title>Efficient IoT Traffic Inference: from Multi-View Classification to Progressive Monitoring.</article-title>
                    <source>

                        <italic toggle="yes">ACM Transactions on Internet of Things.</italic>
</source>
                    <year>2023</year>.
                    <pub-id pub-id-type="doi">10.1145/3625306</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref11">
                <label>11</label>
                <mixed-citation publication-type="other">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Goyal</surname>
                            <given-names>U</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Krishna</surname>
                            <given-names>A</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Kumar</surname>
                            <given-names>A</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <chapter-title>Detection And Prevention Of Cyber Attacks On Multi-purpose IoT Devices Using Honeypot.</chapter-title>
                    <source>

                        <italic toggle="yes">2nd International Conference on &#x201c;Advancement in Electronics &amp; Communication Engineering (AECE 2022)&#x201d;.</italic>
</source>
                    <year>2022</year>.</mixed-citation>
            </ref>
            <ref id="ref12">
                <label>12</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Neto</surname>
                            <given-names>ECP</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Dadkhah</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Ferreira</surname>
                            <given-names>R</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>CICIoT2023: A Real-Time Dataset and Benchmark for Large-Scale Attacks in IoT Environment.</article-title>
                    <source>

                        <italic toggle="yes">Sensors.</italic>
</source>
                    <year>2023</year>;<volume>23</volume>:<fpage>5941</fpage>. 2023.
                    <pub-id pub-id-type="pmid">37447792</pub-id>
                    <pub-id pub-id-type="doi">10.3390/s23135941</pub-id>
                    <pub-id pub-id-type="pmcid">PMC10346235</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref13">
                <label>13</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Anwer</surname>
                            <given-names>M</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Khan</surname>
                            <given-names>SM</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Farooq</surname>
                            <given-names>MU</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Attack Detection in IoT using Machine Learning.</article-title>
                    <source>

                        <italic toggle="yes">Engineering, Technology &amp; Applied Science Research.</italic>
</source>
                    <year>2021</year>;<volume>11</volume>(<issue>3</issue>):<fpage>7273</fpage>&#x2013;<lpage>7278</lpage>.
                    <pub-id pub-id-type="doi">10.48084/etasr.4202</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref22">
                <label>14</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Radanliev</surname>
                            <given-names>P</given-names>
                        </name>

                        <name name-style="western">
                            <surname>De Roure</surname>
                            <given-names>D</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Maple</surname>
                            <given-names>C</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>AI security and cyber risk in IoT systems.</article-title>
                    <source>

                        <italic toggle="yes">Front. Big Data.</italic>
</source>
                    <year>2024</year>;<volume>7</volume>.
                    <pub-id pub-id-type="pmid">39449740</pub-id>
                    <pub-id pub-id-type="doi">10.3389/fdata.2024.1402745</pub-id>
                    <pub-id pub-id-type="pmcid">PMC11499169</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref23">
                <label>15</label>
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Radanliev</surname>
                            <given-names>P</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Santos</surname>
                            <given-names>O</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Brandon-Jones</surname>
                            <given-names>A</given-names>
                        </name>
</person-group>:
                    <article-title>Capability hardware enhanced instructions and artificial intelligence bill of materials in trustworthy artificial intelligence systems: analyzing cybersecurity threats, exploits, and vulnerabilities in new software bills of materials with artificial intelligence.</article-title>
                    <source>

                        <italic toggle="yes">J. Def. Model. Simul. Appl. Methodol. Technol.</italic>
</source>
                    <year>2024</year>;<volume>23</volume>(<issue>1</issue>):<fpage>147</fpage>&#x2013;<lpage>175</lpage>.
                    <pub-id pub-id-type="doi">10.1177/15485129241267919</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref14">
                <label>16</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Laurent Sindayigaya</surname>
                            <given-names>AD</given-names>
                        </name>
</person-group>:
                    <article-title>Machine Learning Algorithms: A Review.</article-title>
                    <source>

                        <italic toggle="yes">International Journal of Science and Research (IJSR).</italic>
</source>
                    <year>2022</year>;<volume>11</volume>:<fpage>1127</fpage>&#x2013;<lpage>1133</lpage>.
                    <issn>2319-7064</issn>.
                    <pub-id pub-id-type="doi">10.21275/SR22815163219</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref15">
                <label>17</label>
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Sarke</surname>
                            <given-names>IH</given-names>
                        </name>
</person-group>:
                    <source>

                        <italic toggle="yes">Machine Learning: Algorithms, Real-World Applications and Research Directions.</italic>
</source>
                    <publisher-name>Springer Nature Singapore</publisher-name>.
                    <pub-id pub-id-type="doi">10.1007/s42979-021-00592-x</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref16">
                <label>18</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Manisha</surname>
                            <given-names>KCJ</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Manjramkar</surname>
                            <given-names>A</given-names>
                        </name>
</person-group>:
                    <article-title>Cyber Security Using Machine Learning Techniques.</article-title>
                    <source>

                        <italic toggle="yes">Advances in Computer Science Research.</italic>
</source>
                    <year>2023</year>.
                    <pub-id pub-id-type="doi">10.2991/978-94-6463-136-4_59</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref17">
                <label>19</label>
                <mixed-citation publication-type="other">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Shaukat</surname>
                            <given-names>K</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Luo</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Chen</surname>
                            <given-names>S</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <chapter-title>Cyber Threat Detection Using Machine Learning Techniques: A Performance Evaluation Perspective.</chapter-title>
                    <source>

                        <italic toggle="yes">2020 International Conference on Cyber Warfare and Security (ICCWS).</italic>
</source>
                    <publisher-loc>Islamabad, Pakistan</publisher-loc>:<year>2020</year>.</mixed-citation>
            </ref>
            <ref id="ref18">
                <label>20</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Kibreab Adane</surname>
                            <given-names>BB</given-names>
                        </name>
</person-group>:
                    <article-title>Machine learning and deep learning based phishing websites detection: the current gaps and next directions.</article-title>
                    <source>

                        <italic toggle="yes">Review of Computer Engineering Research.</italic>
</source>
                    <year>2022</year>;<volume>9</volume>(<issue>1</issue>):<fpage>13</fpage>&#x2013;<lpage>29</lpage>.
                    <pub-id pub-id-type="doi">10.18488/76.v9i1.2983</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref19">
                <label>21</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Abdullahi</surname>
                            <given-names>M</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Baashar</surname>
                            <given-names>Y</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Alhussian</surname>
                            <given-names>H</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Detecting Cybersecurity Attacks in Internet of Things Using Artificial Intelligence Methods: A Systematic Literature Review.</article-title>
                    <source>

                        <italic toggle="yes">Electronics.</italic>
</source>
                    <year>2022</year>;<volume>11</volume>(<issue>2</issue>):<fpage>198</fpage>. 2022.
                    <pub-id pub-id-type="doi">10.3390/electronics11020198</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref20">
                <label>22</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Nazir</surname>
                            <given-names>A</given-names>
                        </name>

                        <name name-style="western">
                            <surname>He</surname>
                            <given-names>J</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Zhu</surname>
                            <given-names>N</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Advancing IoT security: A systematic review of machine learning approaches for the detection of IoT botnets.</article-title>
                    <source>

                        <italic toggle="yes">Journal of King Saud University - Computer and Information Sciences.</italic>
</source>
                    <year>2023</year>;<volume>35</volume>(<issue>10</issue>):<fpage>101820</fpage>.
                    <pub-id pub-id-type="doi">10.1016/j.jksuci.2023.101820</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref21">
                <label>23</label>
                <mixed-citation publication-type="other">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Zolanvari</surname>
                            <given-names>M</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Teixeira</surname>
                            <given-names>MA</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Jain</surname>
                            <given-names>R</given-names>
                        </name>
</person-group>:
                    <chapter-title>Effect of Imbalanced Datasets on Security of Industrial IoT Using Machine Learning.</chapter-title>
                    <source>

                        <italic toggle="yes">2018 IEEE International Conference on Intelligence and Security Informatics (ISI).</italic>
</source>
                    <year>2018</year>.</mixed-citation>
            </ref>
        </ref-list>
    </back>
    <sub-article article-type="reviewer-report" id="report464887">
        <front-stub>
            <article-id pub-id-type="doi">10.5256/f1000research.197072.r464887</article-id>
            <title-group>
                <article-title>Reviewer response for version 2</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author">
                    <name>
                        <surname>Gonaygunta</surname>
                        <given-names>Hari</given-names>
                    </name>
                    <xref ref-type="aff" rid="r464887a1">1</xref>
                    <role>Referee</role>
                </contrib>
                <aff id="r464887a1">
                    <label>1</label>University of the Cumberlands, Williamsburg, USA</aff>
            </contrib-group>
            <author-notes>
                <fn fn-type="conflict">
                    <p>
                        <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>17</day>
                <month>3</month>
                <year>2026</year>
            </pub-date>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2026 Gonaygunta H</copyright-statement>
                <copyright-year>2026</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access peer review report distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <related-article ext-link-type="doi" id="relatedArticleReport464887" related-article-type="peer-reviewed-article" xlink:href="10.12688/f1000research.161643.2"/>
            <custom-meta-group>
                <custom-meta>
                    <meta-name>recommendation</meta-name>
                    <meta-value>approve-with-reservations</meta-value>
                </custom-meta>
            </custom-meta-group>
        </front-stub>
        <body>
            <p>
                <bold>Summary of the Article:</bold>
            </p>
            <p> The article of the research is on the implementation of several methods of the machine learning algorithm to identify and categorize diverse forms of cybersecurity attacks that occur within the Internet of Things systems. The internet of things is growing exponentially and has been estimated to have several ten trillion connected devices. Such expansion is escalating insecurity threats to a similar proportion. The purpose of the study is to create a multi-class attack detection framework based on the different methods of the machine learning algorithm on a specified set of data related to the CICIoT2023 competition having plenty of attack data of various types, including DDoS, reconnaissance, spoofing, Mirai, SQL injection, and numerous others.</p>
            <p> 
                <bold>A. Develop Literature Review and Framework of Contributions.</bold>
            </p>
            <p> Issue: According to the information provided to the authors by the reviewer, it was suggested that the article may be further elaborated through comparison and contrasting the findings and results of the paper with the recent changes and advances in the sphere of IoT security and attack detection through different models and techniques, specifically using AI and deep learning techniques and models to guarantee cybersecurity and resilience to adversarial attacks and imbalanced data.</p>
            <p> 
                <bold>Recommendations:</bold>
            </p>
            <p> To further enrich the paper, one may compare the results and findings of the paper with the recent developments and advancements of the field of IoT security and attack detection by using different models and techniques, particularly the ones that imply the usage of AI and deep learning models and techniques to guarantee cybersecurity against attacks.</p>
            <p> Furthermore, one may compare the results and findings of the models used in the paper with the recent models, techniques, methods, and approaches including CNNs, LSTM, and others.</p>
            <p> 
                <bold>B. Problem Dataset Limitations and Generalizability.</bold>
            </p>
            <p> Issue: Even though the authors have used a dataset of 221,834 instances of the CICIoT2023 dataset, more details concerning the size of the dataset utilized by the authors could be elaborated and justified by the authors to add more details to the paper.</p>
            <p> 
                <bold>Recommendations:</bold> 
                <list list-type="order">
                    <list-item>
                        <p>Talk about the shortcomings of the dataset, e.g. is it representative of actual IoT traffic? Do the patterns of attack vary enough?</p>
                    </list-item>
                    <list-item>
                        <p>To further prove how generally your models can be applied, perform your models on other datasets or even actual traffic.</p>
                    </list-item>
                    <list-item>
                        <p>Report on the skew of the dataset, where any, by your features selection / augmentation techniques.</p>
                    </list-item>
                </list> 
                <bold>Minor Points:</bold> 
                <list list-type="order">
                    <list-item>
                        <p>Better would be sharing more information about the hyperparameters that were optimized to apply the different machine learning algorithms that were applied in the paper. An example is the depth of decision tree algorithm that was implemented within the paper or the kernel function that was implemented within the SVM algorithm within the paper.</p>
                    </list-item>
                    <list-item>
                        <p>More information on the feature selection procedure that was adopted in the paper would be more helpful. As an example, the aspects that the paper chose to use and the steps of applying the PCA algorithm in the paper.</p>
                    </list-item>
                </list> 
                <bold>Conclusion:</bold>
            </p>
            <p> The article is effectively rooted on experimental ground and confirms its arguments with the outcomes of the experiments to demonstrate the high accuracy of the models in the measurement of attacks with decision trees. However, as the required alterations and enhancements are included in the article, it will contribute to its scientific validity and applicability to the area of IoT security even further.</p>
            <p>Is the work clearly and accurately presented and does it cite the current literature?</p>
            <p>Yes</p>
            <p>If applicable, is the statistical analysis and its interpretation appropriate?</p>
            <p>Yes</p>
            <p>Are all the source data underlying the results available to ensure full reproducibility?</p>
            <p>Partly</p>
            <p>Is the study design appropriate and is the work technically sound?</p>
            <p>Yes</p>
            <p>Are the conclusions drawn adequately supported by the results?</p>
            <p>Yes</p>
            <p>Are sufficient details of methods and analysis provided to allow replication by others?</p>
            <p>Yes</p>
            <p>Reviewer Expertise:</p>
            <p>AI, Block Chain, Cybersecurity, Quantum Computing, ML</p>
            <p>I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard, however I have significant reservations, as outlined above.</p>
        </body>
    </sub-article>
    <sub-article article-type="reviewer-report" id="report370251">
        <front-stub>
            <article-id pub-id-type="doi">10.5256/f1000research.177702.r370251</article-id>
            <title-group>
                <article-title>Reviewer response for version 1</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author">
                    <name>
                        <surname>Radanliev</surname>
                        <given-names>Petar</given-names>
                    </name>
                    <xref ref-type="aff" rid="r370251a1">1</xref>
                    <role>Referee</role>
                    <uri content-type="orcid">https://orcid.org/0000-0001-5629-6857</uri>
                </contrib>
                <aff id="r370251a1">
                    <label>1</label>University of Oxford, Oxford, England, UK</aff>
            </contrib-group>
            <author-notes>
                <fn fn-type="conflict">
                    <p>
                        <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>17</day>
                <month>3</month>
                <year>2025</year>
            </pub-date>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2025 Radanliev P</copyright-statement>
                <copyright-year>2025</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access peer review report distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <related-article ext-link-type="doi" id="relatedArticleReport370251" related-article-type="peer-reviewed-article" xlink:href="10.12688/f1000research.161643.1"/>
            <custom-meta-group>
                <custom-meta>
                    <meta-name>recommendation</meta-name>
                    <meta-value>approve-with-reservations</meta-value>
                </custom-meta>
            </custom-meta-group>
        </front-stub>
        <body>
            <p>The article is well-structured and well-written. It deserves consideration for indexing. There are some corrections, which I outline in more detail below:&#x00a0;</p>
            <p> </p>
            <p> The article is a bit short, I am not certain about the journal page limit, but if you have space, try to expand with a focus on contribution. One way to improve your contributions is to improve your review and compare existing literature and knowledge. For example,&#x00a0;you have done a great job reviewing so many articles, but only a few articles on cyber risk from future developments in new technologies, such as AI, which seems to be all the rage at the moment. There are recent articles on this topic that review recent and relevant literature, for example, on the related topic of cybersecurity threats, exploits, and vulnerabilities in new software bills of materials with artificial intelligence - see: [Ref 1]&#x00a0;and on the related topic of&#x00a0; &#x2018;AI security and cyber risk in IoT systems&#x2019; - see: [Ref 2] It would be interesting to see a few sentences reviewing and comparing your work in relations to these recent studies in related topics.</p>
            <p> </p>
            <p> - in conclusion, could you highlight your conclusions on what urgent measures can be taken to help the industry adapt to these findings?&#x00a0;</p>
            <p> </p>
            <p> I hope the comments and feedback are helpful, and well done for writing such an interesting article. I am looking forward to reading the updated version.</p>
            <p>Is the work clearly and accurately presented and does it cite the current literature?</p>
            <p>Yes</p>
            <p>If applicable, is the statistical analysis and its interpretation appropriate?</p>
            <p>I cannot comment. A qualified statistician is required.</p>
            <p>Are all the source data underlying the results available to ensure full reproducibility?</p>
            <p>Partly</p>
            <p>Is the study design appropriate and is the work technically sound?</p>
            <p>Yes</p>
            <p>Are the conclusions drawn adequately supported by the results?</p>
            <p>Yes</p>
            <p>Are sufficient details of methods and analysis provided to allow replication by others?</p>
            <p>Yes</p>
            <p>Reviewer Expertise:</p>
            <p>AI security, IoT, cyber risk, blockchchain security, post-quantum cryptography.</p>
            <p>I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard, however I have significant reservations, as outlined above.</p>
        </body>
        <back>
            <ref-list>
                <title>References</title>
                <ref id="rep-ref-370251-1">
                    <label>1</label>
                    <mixed-citation publication-type="journal">
                        <person-group person-group-type="author"/>:
                        <article-title>Capability hardware enhanced instructions and artificial intelligence bill of materials in trustworthy artificial intelligence systems: analyzing cybersecurity threats, exploits, and vulnerabilities in new software bills of materials with artificial intelligence</article-title>.
                        <source>
                            <italic>The Journal of Defense Modeling and Simulation: Applications, Methodology, Technology</italic>
                        </source>.<year>2024</year>;
                        <elocation-id>10.1177/15485129241267919</elocation-id>
                        <pub-id pub-id-type="doi">10.1177/15485129241267919</pub-id>
                    </mixed-citation>
                </ref>
                <ref id="rep-ref-370251-2">
                    <label>2</label>
                    <mixed-citation publication-type="journal">
                        <person-group person-group-type="author"/>:
                        <article-title>AI security and cyber risk in IoT systems.</article-title>
                        <source>
                            <italic>Front Big Data</italic>
                        </source>.<year>2024</year>;<volume>7</volume>:
                        <elocation-id>10.3389/fdata.2024.1402745</elocation-id>
                        <fpage>1402745</fpage>
                        <pub-id pub-id-type="pmid">39449740</pub-id>
                        <pub-id pub-id-type="doi">10.3389/fdata.2024.1402745</pub-id>
                    </mixed-citation>
                </ref>
            </ref-list>
        </back>
        <sub-article article-type="response" id="comment13575-370251">
            <front-stub>
                <contrib-group>
                    <contrib contrib-type="author">
                        <name>
                            <surname>Abebe</surname>
                            <given-names>Anduamlak</given-names>
                        </name>
                        <aff>Computer Science, Debre Tabor University, Debre Tabor, Amhara, Ethiopia</aff>
                    </contrib>
                </contrib-group>
                <author-notes>
                    <fn fn-type="conflict">
                        <p>
                            <bold>Competing interests: </bold>No any competing interest</p>
                    </fn>
                </author-notes>
                <pub-date pub-type="epub">
                    <day>17</day>
                    <month>3</month>
                    <year>2025</year>
                </pub-date>
            </front-stub>
            <body>
                <p>Thank you for your constructive comment. We acknowledge the reviewer&#x2019;s concerns regarding to expansion of existing literature and knowledge&#x00a0;comparision.&#x00a0; We also acknowledge the reviewer&#x2019;s concerns regarding the conclusion section.&#x00a0;</p>
                <p> We will revise as per your comment.</p>
            </body>
        </sub-article>
    </sub-article>
</article>
