<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.2 20190208//EN" "http://jats.nlm.nih.gov/publishing/1.2/JATS-journalpublishing1.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="other" dtd-version="1.2" xml:lang="en">
    <front>
        <journal-meta>
            <journal-id journal-id-type="pmc">F1000Research</journal-id>
            <journal-title-group>
                <journal-title>F1000Research</journal-title>
            </journal-title-group>
            <issn pub-type="epub">2046-1402</issn>
            <publisher>
                <publisher-name>F1000 Research Limited</publisher-name>
                <publisher-loc>London, UK</publisher-loc>
            </publisher>
        </journal-meta>
        <article-meta>
            <article-id pub-id-type="doi">10.12688/f1000research.149391.2</article-id>
            <article-categories>
                <subj-group subj-group-type="heading">
                    <subject>Software Tool Article</subject>
                </subj-group>
                <subj-group>
                    <subject>Articles</subject>
                </subj-group>
            </article-categories>
            <title-group>
                <article-title>Leveraging Quadratic Polynomials in Python for Advanced Data Analysis</article-title>
                <fn-group content-type="pub-status">
                    <fn>
                        <p>[version 2; peer review: 2 approved]</p>
                    </fn>
                </fn-group>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author" corresp="yes">
                    <name>
                        <surname>Sipakov</surname>
                        <given-names>Rostyslav</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Conceptualization</role>
                    <role content-type="http://credit.niso.org/">Data Curation</role>
                    <role content-type="http://credit.niso.org/">Supervision</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Original Draft Preparation</role>
                    <uri content-type="orcid">https://orcid.org/0000-0002-0862-5043</uri>
                    <xref ref-type="corresp" rid="c1">a</xref>
                    <xref ref-type="aff" rid="a1">1</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Voloshkina</surname>
                        <given-names>Olena</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Formal Analysis</role>
                    <role content-type="http://credit.niso.org/">Methodology</role>
                    <uri content-type="orcid">https://orcid.org/0000-0002-3671-4449</uri>
                    <xref ref-type="aff" rid="a1">1</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Kovalova</surname>
                        <given-names>Anastasiia</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Formal Analysis</role>
                    <role content-type="http://credit.niso.org/">Resources</role>
                    <xref ref-type="aff" rid="a1">1</xref>
                </contrib>
                <aff id="a1">
                    <label>1</label>Department of Environmental Protection and Occupational Safety Technologies, Kyiv National University of Construction and Architecture, Kyiv, 03037, Ukraine</aff>
            </contrib-group>
            <author-notes>
                <corresp id="c1">
                    <label>a</label>
                    <email xlink:href="mailto:sipakov.rv@knuba.edu.ua">sipakov.rv@knuba.edu.ua</email>
                </corresp>
                <fn fn-type="conflict">
                    <p>
                        <bold>Competing interests: </bold>Dr. Sipakov is affiliated with CoastalQuant, Inc., which has funded this research. Although the opinions expressed in this paper are those of the authors, they may be influenced by the interests of CoastalQuant, Inc., its clients, affiliates, or employees.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>20</day>
                <month>8</month>
                <year>2024</year>
            </pub-date>
            <pub-date pub-type="collection">
                <year>2024</year>
            </pub-date>
            <volume>13</volume>
            <elocation-id>490</elocation-id>
            <history>
                <date date-type="accepted">
                    <day>2</day>
                    <month>8</month>
                    <year>2024</year>
                </date>
            </history>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2024 Sipakov R et al.</copyright-statement>
                <copyright-year>2024</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access article distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <self-uri content-type="pdf" xlink:href="https://f1000research.com/articles/13-490/pdf"/>
            <abstract>
                <p>This research explores the application of quadratic polynomials in Python for advanced data analysis. The study demonstrates how quadratic models can effectively capture nonlinear relationships in complex datasets by leveraging Python libraries such as NumPy, Matplotlib, scikit-learn, and Pandas. The methodology involves fitting quadratic polynomials to the data using least-squares regression and evaluating the model fit using the coefficient of determination (R-squared). The results highlight the strong performance of the quadratic polynomial fit, as evidenced by high R-squared values, indicating the model&#x2019;s ability to explain a substantial proportion of the data variability. Comparisons with linear and cubic models further underscore the quadratic model&#x2019;s balance between simplicity and precision for many practical applications. The study also acknowledges the limitations of quadratic polynomials and proposes future research directions to enhance their accuracy and efficiency for diverse data analysis tasks. This research bridges the gap between theoretical concepts and practical implementation, providing an accessible Python-based tool for leveraging quadratic polynomials in data analysis.</p>
            </abstract>
            <abstract abstract-type="plain-language-summary">
                <title>Plain Language Summary</title>
                <p>This study examines how quadratic polynomials, which are mathematical equations used to model and understand patterns in data, can be effectively applied using Python, a versatile programming language with libraries suited for mathematical and visual analysis. Researchers have focused on the adaptability of these polynomials in various fields, from software analytics to materials science, in order to provide practical Python code examples. They also discussed the predictive accuracy of the method, confirmed through a statistical measure called R-squared, and acknowledged the need for future research to integrate more complex models for richer data interpretation.</p>
            </abstract>
            <kwd-group kwd-group-type="author">
                <kwd>python</kwd>
                <kwd>quadratic polynomials</kwd>
                <kwd>analyzing data</kwd>
                <kwd>polynomial model</kwd>
            </kwd-group>
            <funding-group>
                <award-group id="fund-1">
                    <funding-source>CoastalQuant, Inc. (Tampa, FL, U.S.)</funding-source>
                </award-group>
                <funding-statement>This work was supported by CoastalQuant, Inc. (Tampa, FL, USA). </funding-statement>
                <funding-statement>
                    <italic>The funders had no role in study design, data collection and analysis, decision to publish, or preparation of the manuscript.</italic>
                </funding-statement>
            </funding-group>
        </article-meta>
        <notes>
            <sec sec-type="version-changes">
                <label>Revised</label>
                <title>Amendments from Version 1</title>
                <p>This revised version of the article includes several significant enhancements based on the reviewer's feedback. Introduction: This paper highlights quadratic polynomials' unique advantages in capturing curvature and non-linear relationships. It also includes a brief comparison with other models, such as linear and cubic polynomials, emphasizing specific scenarios where quadratic polynomials are most effective. Data Preprocessing Steps:&#x00a0;A new subsection has been added detailing the preprocessing steps undertaken before fitting the quadratic model. This includes techniques for handling missing data, detecting and treating outliers, and applying data normalization or scaling. This addition aims to provide a clearer understanding of the steps taken to prepare the data for analysis. Discussion of R-squared Limitations: The methods section now contains a paragraph discussing the limitations of using R-squared as the sole measure of model fit. It suggests additional metrics such as Adjusted R-squared, Mean Squared Error (MSE), and Root Mean Squared Error (RMSE) to offer a more comprehensive evaluation of model performance. Results: A new section has been included comparing the performance of quadratic polynomials with linear and cubic models using the same datasets. The comparison uses metrics like R-squared, Adjusted R-squared, and MSE to evaluate the fit and predictive accuracy, providing a broader perspective on the effectiveness of quadratic models. Discussion: The discussion now delves deeper into the potential challenges and limitations of quadratic polynomials, such as overfitting and sensitivity to data variability. It addresses scenarios where quadratic polynomials might overfit, particularly with small or noisy datasets, and suggests methods for mitigating these issues, including regularization techniques and cross-validation methods. 
This addition aims to provide a more balanced view of the use of quadratic polynomials in data analysis. Figures: all Figures have been revised.</p>
            </sec>
        </notes>
    </front>
    <body>
        <sec id="sec1" sec-type="intro">
            <title>1. Introduction</title>
            <p>In exploring the quadratic polynomials used in various applications in Python for data analysis, we found significant contributions across various domains, exemplifying their utility and versatility. Quadratic polynomials have been found to be extensively valuable in fields such as physics, fluid mechanics, and chemical reaction modeling due to their effectiveness in capturing non-linearities.</p>
            <p>The primary advantage of quadratic polynomials lies in their ability to capture curvature, allowing them to model complex patterns beyond the reach of traditional linear models. This capacity to represent curved relationships is crucial for accurately depicting trends in data, particularly when there are significant changes in the rate of increase or decrease. Despite their ability to handle non-linear relationships, quadratic polynomials remain relatively simple and interpretable (
                <xref ref-type="bibr" rid="ref14">Fuchs et al., 2009</xref>). Additionally, they are computationally efficient compared to higher-degree polynomials or more complex non-linear models. For example, theoretical physics has employed actions quadratic in curvature and polynomial in variables to effectively describe observer spaces (
                <xref ref-type="bibr" rid="ref12">Koivisto et al., 2019</xref>). In computer science, quadratic polynomial interpolation has been applied in 3D path planning to derive continuous paths for each axis (
                <xref ref-type="bibr" rid="ref13">Chang &amp; Huh, 2015</xref>). When compared to linear and cubic polynomials, quadratic polynomials are particularly useful in scenarios where relationships are non-linear but not overly complex to necessitate higher-order polynomials. Linear models struggle to capture curvature and non-linear patterns, while cubic polynomials may introduce unnecessary complexity where a quadratic model would suffice (
                <xref ref-type="bibr" rid="ref15">Gibert et al., 2000</xref>).</p>
            <p>As mentioned above, the use of quadratic polynomials in modeling has proven beneficial in various applications. 
                <xref ref-type="bibr" rid="ref4">Aladesanmi et al. (2021)</xref> illustrated the adaptability of quadratic polynomials in material science and applied these models to understand the wear rate and hardness of Ti and TiB2 nanocomposites. Their research findings, indicating a better fit for the quadratic model with an adjusted R-squared value of 0.8883, underscore the utility of quadratic polynomials in material science research. In epidemiology, 
                <xref ref-type="bibr" rid="ref5">Yadav (2020)</xref> leveraged quadratic polynomial regression models to analyze the COVID-19 epidemic in India, demonstrating its effectiveness in epidemic forecasting. This example reflects the predictive power of mathematical models and their crucial role in public health planning and responses (
                <xref ref-type="bibr" rid="ref5">Yadav, 2020</xref>). In the context of urban development and assessment of geotechnical conditions, the incorporation of Python for data analysis, particularly through quadratic polynomials, can significantly enhance the understanding and monitoring of complex ground conditions (
                <xref ref-type="bibr" rid="ref6">Kaliukh et al., 2022</xref>). In the context of quadratic polynomial regression, it is essential to note that quadratic polynomial step regression is an advanced tool capable of utilizing orthogonal experimental data to build a regression model, while avoiding instability in the regression coefficients owing to the multicollinearity of the variables (
                <xref ref-type="bibr" rid="ref14">Wang et al., 2014</xref>). This highlights the potential of quadratic polynomials for handling complex data relationships and providing accurate regression models. 
                <xref ref-type="bibr" rid="ref12">Gong and Zhang (2021)</xref> developed a polynomial regression model to predict Python usage trends. Their model, which demonstrated high accuracy with a training set score of 0.912862 and a test set score of 0.886600, highlighted the effectiveness of quadratic polynomials in forecasting software usage patterns (
                <xref ref-type="bibr" rid="ref12">Gong and Zhang, 2021</xref>).</p>
            <p>Python, a high-level programming language, provides an ideal environment for the rapid prototyping of data analytic tools and includes powerful tools for visualization, data sharing, and statistical analysis, such as Matplotlib, iPython, NumPy, and SciPy (
                <xref ref-type="bibr" rid="ref2">Alexander et al., 2017</xref>). 
                <xref ref-type="bibr" rid="ref12">Gong and Zhang (2021)</xref> presented a compelling application for predicting Python usage trends and demonstrated a robust model fit with practical implications for software analytics. In summary, Python, with its extensive libraries and capabilities for rapid prototyping, visualization, and scientific computation, provides a robust platform for leveraging quadratic polynomials in advanced data analysis tasks.</p>
        </sec>
        <sec id="sec2" sec-type="methods">
            <title>2. Methods</title>
            <sec id="sec3">
                <title>2.1 Design and development environment</title>
                <p>In this study, we focused on applying quadratic polynomials in Python for data analysis, highlighting the importance of these mathematical expressions in modeling and interpreting complex datasets using the following key concepts:
                    <list list-type="bullet">
                        <list-item>
                            <label>&#x2022;</label>
                            <p>Quadratic polynomials: Defined by the general form 
                                <inline-formula>
                                    <mml:math display="inline">
                                        <mml:mi>a</mml:mi>
                                        <mml:msup>
                                            <mml:mi>x</mml:mi>
                                            <mml:mn>2</mml:mn>
                                        </mml:msup>
                                        <mml:mo>+</mml:mo>
                                        <mml:mi mathvariant="italic">bx</mml:mi>
                                        <mml:mo>+</mml:mo>
                                        <mml:mi>c</mml:mi>
                                    </mml:math>
                                </inline-formula>, where 
                                <inline-formula>
                                    <mml:math display="inline">
                                        <mml:mrow>
                                            <mml:mo stretchy="true">(</mml:mo>
                                            <mml:mi>a</mml:mi>
                                            <mml:mo stretchy="true">)</mml:mo>
                                        </mml:mrow>
                                        <mml:mo>,</mml:mo>
                                        <mml:mrow>
                                            <mml:mo stretchy="true">(</mml:mo>
                                            <mml:mi>b</mml:mi>
                                            <mml:mo stretchy="true">)</mml:mo>
                                        </mml:mrow>
                                        <mml:mo>,</mml:mo>
                                        <mml:mrow>
                                            <mml:mo stretchy="true">(</mml:mo>
                                            <mml:mi>c</mml:mi>
                                            <mml:mo stretchy="true">)</mml:mo>
                                        </mml:mrow>
                                    </mml:math>
                                </inline-formula>, are coefficients. These polynomials are essential for capturing curvature in datasets indicative of various natural and human-made phenomena.</p>
                        </list-item>
                        <list-item>
                            <label>&#x2022;</label>
                            <p>Python libraries: NumPy (open source, available&#x00a0;at 
                                <ext-link ext-link-type="uri" xlink:href="https://numpy.org">https://numpy.org</ext-link>) was used for numerical computations, and Matplotlib (also open source, available at 
                                <ext-link ext-link-type="uri" xlink:href="https://matplotlib.org">https://matplotlib.org</ext-link>) was used to plot the data and polynomial curves, showing how these tools were integrated for data analysis. Additionally, we applied the following open source libraries: scikit-learn, a popular machine learning library in Python that offers a plethora of features that make it a preferred choice for machine learning practitioners, available at 
                                <ext-link ext-link-type="uri" xlink:href="https://scikit-learn.org/">https://scikit-learn.org/</ext-link>, and Pandas, a powerful tool in Python for data manipulation and analysis, available at 
                                <ext-link ext-link-type="uri" xlink:href="https://pandas.pydata.org/">https://pandas.pydata.org/</ext-link>.</p>
                        </list-item>
                        <list-item>
                            <label>&#x2022;</label>
                            <p>Regression analysis: Explains how quadratic polynomials can be fitted to data points to model relationships within the data, emphasizing practical applications through Python coding examples.</p>
                        </list-item>
                        <list-item>
                            <label>&#x2022;</label>
                            <p>Coefficient of determination (R-squared): Discusses the computation and interpretation of R-squared to measure how well the polynomial model fits the data.</p>
                        </list-item>
                    </list>
                </p>
                <p>A quadratic polynomial is an algebraic equation of the second degree, which includes a term raised to a power of two (squared). The general form of a quadratic polynomial is
                    <inline-formula>
                        <mml:math display="inline">
                            <mml:mspace width="0.25em"/>
                            <mml:mi>y</mml:mi>
                            <mml:mo>=</mml:mo>
                            <mml:mi>a</mml:mi>
                            <mml:msup>
                                <mml:mi>x</mml:mi>
                                <mml:mn>2</mml:mn>
                            </mml:msup>
                            <mml:mo>+</mml:mo>
                            <mml:mi mathvariant="italic">bx</mml:mi>
                            <mml:mo>+</mml:mo>
                            <mml:mi>c</mml:mi>
                        </mml:math>
                    </inline-formula>, where 
                    <inline-formula>
                        <mml:math display="inline">
                            <mml:mrow>
                                <mml:mo stretchy="true">(</mml:mo>
                                <mml:mi>y</mml:mi>
                                <mml:mo stretchy="true">)</mml:mo>
                            </mml:mrow>
                        </mml:math>
                    </inline-formula> is the dependent variable; 
                    <inline-formula>
                        <mml:math display="inline">
                            <mml:mrow>
                                <mml:mo stretchy="true">(</mml:mo>
                                <mml:mi>x</mml:mi>
                                <mml:mo stretchy="true">)</mml:mo>
                            </mml:mrow>
                        </mml:math>
                    </inline-formula> is the independent variable; and 
                    <inline-formula>
                        <mml:math display="inline">
                            <mml:mrow>
                                <mml:mo stretchy="true">(</mml:mo>
                                <mml:mi>a</mml:mi>
                                <mml:mo stretchy="true">)</mml:mo>
                            </mml:mrow>
                            <mml:mo>,</mml:mo>
                            <mml:mrow>
                                <mml:mo stretchy="true">(</mml:mo>
                                <mml:mi>b</mml:mi>
                                <mml:mo stretchy="true">)</mml:mo>
                            </mml:mrow>
                            <mml:mo>,</mml:mo>
                            <mml:mrow>
                                <mml:mo stretchy="true">(</mml:mo>
                                <mml:mi>c</mml:mi>
                                <mml:mo stretchy="true">)</mml:mo>
                            </mml:mrow>
                        </mml:math>
                    </inline-formula> are the coefficients of the polynomial estimated by the regression model. The quadratic term 
                    <inline-formula>
                        <mml:math display="inline">
                            <mml:mrow>
                                <mml:mo stretchy="true">(</mml:mo>
                                <mml:mi>a</mml:mi>
                                <mml:msup>
                                    <mml:mi>x</mml:mi>
                                    <mml:mn>2</mml:mn>
                                </mml:msup>
                                <mml:mo stretchy="true">)</mml:mo>
                            </mml:mrow>
                        </mml:math>
                    </inline-formula> allows the model to capture the curvature in the data, which is indicative of the accelerating increases or decreases that are common in many natural phenomena.</p>
                <p>Some key features of quadratic polynomials are that they have two terms with a variable 
                    <inline-formula>
                        <mml:math display="inline">
                            <mml:mrow>
                                <mml:mo stretchy="true">(</mml:mo>
                                <mml:mi>x</mml:mi>
                                <mml:mo stretchy="true">)</mml:mo>
                            </mml:mrow>
                        </mml:math>
                    </inline-formula>: one is 
                    <inline-formula>
                        <mml:math display="inline">
                            <mml:mrow>
                                <mml:mo stretchy="true">(</mml:mo>
                                <mml:mi>x</mml:mi>
                                <mml:mo stretchy="true">)</mml:mo>
                            </mml:mrow>
                        </mml:math>
                    </inline-formula> squared, and the other is 
                    <inline-formula>
                        <mml:math display="inline">
                            <mml:mrow>
                                <mml:mo stretchy="true">(</mml:mo>
                                <mml:mi>x</mml:mi>
                                <mml:mo stretchy="true">)</mml:mo>
                            </mml:mrow>
                        </mml:math>
                    </inline-formula> to the first power. The 
                    <inline-formula>
                        <mml:math display="inline">
                            <mml:mrow>
                                <mml:mo stretchy="true">(</mml:mo>
                                <mml:msup>
                                    <mml:mi>x</mml:mi>
                                    <mml:mn>2</mml:mn>
                                </mml:msup>
                                <mml:mo stretchy="true">)</mml:mo>
                            </mml:mrow>
                        </mml:math>
                    </inline-formula> term has a non-zero coefficient 
                    <inline-formula>
                        <mml:math display="inline">
                            <mml:mrow>
                                <mml:mo stretchy="true">(</mml:mo>
                                <mml:mi>a</mml:mi>
                                <mml:mo stretchy="true">)</mml:mo>
                            </mml:mrow>
                        </mml:math>
                    </inline-formula>. This makes it a quadratic polynomial rather than a linear polynomial. When plotted, quadratic polynomials form a parabolic shape rather than a straight line. Quadratic polynomials have up to two distinct real roots, which are the solutions of the equation 
                    <inline-formula>
                        <mml:math display="inline">
                            <mml:mi>a</mml:mi>
                            <mml:msup>
                                <mml:mi>x</mml:mi>
                                <mml:mn>2</mml:mn>
                            </mml:msup>
                            <mml:mo>+</mml:mo>
                            <mml:mi mathvariant="italic">bx</mml:mi>
                            <mml:mo>+</mml:mo>
                            <mml:mi>c</mml:mi>
                            <mml:mo>=</mml:mo>
                            <mml:mn>0</mml:mn>
                        </mml:math>
                    </inline-formula>. These solutions can be obtained by factoring or by using the quadratic formula. Examples of quadratic polynomials include the vertex form 
                    <inline-formula>
                        <mml:math display="inline">
                            <mml:mi>y</mml:mi>
                            <mml:mo>=</mml:mo>
                            <mml:mi>a</mml:mi>
                            <mml:msup>
                                <mml:mrow>
                                    <mml:mo stretchy="true">(</mml:mo>
                                    <mml:mi>x</mml:mi>
                                    <mml:mo>&#x2212;</mml:mo>
                                    <mml:mi>h</mml:mi>
                                    <mml:mo stretchy="true">)</mml:mo>
                                </mml:mrow>
                                <mml:mn>2</mml:mn>
                            </mml:msup>
                            <mml:mo>+</mml:mo>
                            <mml:mi>k</mml:mi>
                        </mml:math>
                    </inline-formula>, and the standard form 
                    <inline-formula>
                        <mml:math display="inline">
                            <mml:mi>y</mml:mi>
                            <mml:mo>=</mml:mo>
                            <mml:mi>a</mml:mi>
                            <mml:msup>
                                <mml:mi>x</mml:mi>
                                <mml:mn>2</mml:mn>
                            </mml:msup>
                            <mml:mo>+</mml:mo>
                            <mml:mi mathvariant="italic">bx</mml:mi>
                            <mml:mo>+</mml:mo>
                            <mml:mi>c</mml:mi>
                        </mml:math>
                    </inline-formula>. A quadratic polynomial has a squared, linear, and constant term, graphs as a parabola, and two roots at most.</p>
                <p>Understanding their structures allows many mathematical and real-world problems to be solved. We provide an example of the Python script below, which employs a quadratic polynomial fitting technique&#x2013;a method used in regression analysis to model the relationship between a dependent variable and one or more independent variables. In this case, the independent variable is time (represented in months), and the dependent variable is the metric of interest (such as pollution levels).</p>
                <p>After fitting the quadratic polynomial to the data, the script generated a smooth fitted curve that represented the estimated values of the dependent variable across a range of independent variables. This curve helps to visualize the overall trend and any potential seasonal patterns or anomalies in the dataset.</p>
                <p>The coefficient of determination, commonly known as R-squared 
                    <inline-formula>
                        <mml:math display="inline">
                            <mml:mrow>
                                <mml:mo stretchy="true">(</mml:mo>
                                <mml:msup>
                                    <mml:mi>R</mml:mi>
                                    <mml:mn>2</mml:mn>
                                </mml:msup>
                                <mml:mo stretchy="true">)</mml:mo>
                            </mml:mrow>
                        </mml:math>
                    </inline-formula>, was then calculated to quantify the goodness of fit of the polynomial model. It is a statistical measure that indicates the proportion of variance in the dependent variable that is predictable from independent variable(s). An 
                    <inline-formula>
                        <mml:math display="inline">
                            <mml:mrow>
                                <mml:mo stretchy="true">(</mml:mo>
                                <mml:msup>
                                    <mml:mi>R</mml:mi>
                                    <mml:mn>2</mml:mn>
                                </mml:msup>
                                <mml:mo stretchy="true">)</mml:mo>
                            </mml:mrow>
                        </mml:math>
                    </inline-formula> value of one (1) indicates a perfect fit, meaning that the model explains all the data variability around its mean. In contrast, an 
                    <inline-formula>
                        <mml:math display="inline">
                            <mml:mrow>
                                <mml:mo stretchy="true">(</mml:mo>
                                <mml:msup>
                                    <mml:mi>R</mml:mi>
                                    <mml:mn>2</mml:mn>
                                </mml:msup>
                                <mml:mo stretchy="true">)</mml:mo>
                            </mml:mrow>
                        </mml:math>
                    </inline-formula> value closer to zero (0) indicates that the model fails to accurately model the data.</p>
                <p>For more in-depth information on quadratic polynomial fitting and calculation of the coefficient of determination, the following sources (
                    <xref ref-type="bibr" rid="ref7">Norman R. Draper and Harry Smith, 2014</xref>; 
                    <xref ref-type="bibr" rid="ref8">Douglas et al., 2021</xref>) provide a comprehensive overview of seminal works on regression analysis and detailed explanations of various regression techniques, including quadratic polynomial fitting and the interpretation of 
                    <inline-formula>
                        <mml:math display="inline">
                            <mml:mrow>
                                <mml:mo stretchy="true">(</mml:mo>
                                <mml:msup>
                                    <mml:mi>R</mml:mi>
                                    <mml:mn>2</mml:mn>
                                </mml:msup>
                                <mml:mo stretchy="true">)</mml:mo>
                            </mml:mrow>
                        </mml:math>
                    </inline-formula>.</p>
                <p>Next, we applied quadratic polynomial fitting and R-squared in Python for the data analysis.</p>
                <p>In this case, the Python script exemplifies the application of regression analysis using the NumPy, Matplotlib, scikit-learn, and Pandas libraries to model and visualize trends in time-series data. A core component of this analysis is the fitting of a quadratic polynomial to the data, grounded in the principles of statistical learning.</p>
                <p>The schematic block diagram in 
                    <xref ref-type="fig" rid="f1">Figure 1</xref> shows the framework of the application explained in this research: implementing quadratic polynomials in Python for advanced data analysis.</p>
                <fig fig-type="figure" id="f1" orientation="portrait" position="float">
                    <label>Figure 1. </label>
                    <caption>
                        <title>Schematic block diagram of implementing quadratic polynomials in Python for advanced data analysis.</title>
                    </caption>
                    <graphic id="gr1" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/169942/7b98933b-927e-4eb2-b174-a59720c471f8_figure1.gif"/>
                </fig>
            </sec>
            <sec id="sec4">
                <title>2.2 Data preprocessing</title>
                <p>
                    <bold>
                        <italic toggle="yes">2.2.1 Handling missing data</italic>
                    </bold>
                </p>
                <p>Before fitting the quadratic model, it is crucial to address any missing values in the dataset to ensure the accuracy and reliability of the model. Common techniques for handling missing data include:
                    <list list-type="alpha-lower">
                        <list-item>
                            <label>a.</label>
                            <p>Removal of missing values</p>
                            <p>This involves deleting rows or columns that contain missing values. This method is straightforward but may lead to loss of valuable information if the dataset has many missing entries. The Python-formatted version of the code snippet for this technique is similar to:

                                <preformat orientation="portrait" position="float" preformat-type="computer code" xml:space="preserve">
                                    <monospace># Removing rows with missing values</monospace>

                                    <monospace>data_cleaned = data.dropna()</monospace>
                                </preformat>
</p>
                        </list-item>
                        <list-item>
                            <label>b.</label>
                            <p>Imputation</p>
                            <p>This technique fills in missing values with plausible data. Common imputation methods include:</p>
                            <p>
                                <bold>Mean or Median Imputation -</bold> Replaces missing values with the mean or median of the column. The Python-formatted version of the code snippet for this technique is similar to:

                                <preformat orientation="portrait" position="float" preformat-type="computer code" xml:space="preserve">
                                    <monospace># Mean or Median Imputation</monospace>

                                    <monospace>data['column_name'].fillna (data['column_name'].mean(), inplace=True)</monospace>
                                </preformat>
</p>
                            <p>
                                <bold>Forward or Backward Fill -</bold> Uses the previous or next observation to fill missing values. The Python-formatted version of the code snippet for this technique is similar to:

                                <preformat orientation="portrait" position="float" preformat-type="computer code" xml:space="preserve">
                                    <monospace># Forward or Backward Fill</monospace>

                                    <monospace>data.fillna(method='ffill', inplace=True)</monospace>
                                </preformat>
</p>
                        </list-item>
                    </list>
                </p>
                <p>In the context of machine learning, the exclusion of rows containing missing values without the application of imputation techniques can result in substantial data attrition, particularly in datasets with a high incidence of missing entries. This practice can diminish the statistical power of the analysis and introduce bias into the results. Imputation mitigates this bias by populating missing values with plausible data points, thus enabling the model to utilize the maximum amount of available data. Models that are trained on complete datasets, including imputed values, exhibit greater consistency and robustness compared to those trained on datasets with omitted missing values (
                    <xref ref-type="bibr" rid="ref20">Liu et al., 2020</xref>; 
                    <xref ref-type="bibr" rid="ref21">Dubey &amp; Rasool, 2021</xref>).</p>
                <p>For numerical data, simple imputation methods, such as substituting missing values with the mean or median, are both effective and straightforward. This approach operates under the assumption that the data is missing at random, thereby not introducing significant bias. In the context of more complex datasets, advanced imputation techniques, including K-Nearest Neighbors (KNN), regression imputation, or multiple imputation, can yield more accurate estimations of missing values (
                    <xref ref-type="bibr" rid="ref18">Suh &amp; Song, 2023</xref>; 
                    <xref ref-type="bibr" rid="ref19">Karrar, 2022</xref>). It is important to note that numerous machine learning algorithms are incapable of processing missing data and will either fail or generate errors in the presence of such data (
                    <xref ref-type="bibr" rid="ref17">Fleck et al., 2019</xref>). Imputation ensures the completeness and compatibility of the dataset with these algorithms.</p>
                <p>Appropriate imputation techniques are crucial for preserving the inherent relationships and variability within the data, which in turn enhances the accuracy and reliability of the resulting models.</p>
                <p>Let&#x2019;s consider a situation where we are analyzing the impact of outdoor air pollution at a highway intersection on different days of the week. Depending on various factors, data may not always be recorded daily. Thus, when analyzing a dataset for an entire calendar year, simply removing rows with missing data would not provide a complete assessment of the full year. Imputation allows us to fill these gaps, maintaining a complete and continuous dataset for analysis. For real practice cases, for example, the incidence of secondary air pollution by formaldehyde, arising from photochemical reactions in urban environments, is exhibiting an increasing trend (
                    <xref ref-type="bibr" rid="ref16">Voloshkina et al., 2019</xref>). To accurately assess non-carcinogenic and carcinogenic risks and thereby mitigate disease incidence in the population, it is imperative to utilize the most comprehensive datasets of air pollution parameters (
                    <xref ref-type="bibr" rid="ref22">Sipakov et al., 2018</xref>). However, obtaining such extensive datasets is often not technically feasible. In such scenarios, the aforementioned imputation can play a pivotal role in addressing these data deficiencies.</p>
                <p>Additionally, we would like to note that in the context of the dataset and its analysis, the user needs to determine what is most appropriate for the given case: the technique of removing rows with missing values or imputation based on a number of factors. With a small amount of missing data, up to 5 percent, removing such rows from the dataset will not significantly impact the analysis results. However, with a large amount of missing data, more than 5 percent, simply deleting rows can lead to a significant loss of information, making imputation the most appropriate option. If the data in the dataset under consideration is missing randomly, filling in using the mean or median value may be a more effective method. If there is a pattern in the missing data (for example, specific days of the week), more complex filling methods specific to the particular domain will be required. However, it is important to pay significant attention to the specific application of the dataset. For example, if we are analyzing daily air pollution indicators collected every day, data from Monday to Thursday from 8 AM to 5 PM in urban areas will likely be similar to each other under stable weather conditions. But they can differ significantly with changes in weather conditions, day of the week (Monday vs. Saturday), and time of day (day vs. night), particularly in terms of traffic congestion on highways, for instance.</p>
                <p>
                    <bold>
                        <italic toggle="yes">2.2.2 Outlier detection and treatment</italic>
                    </bold>
                </p>
                <p>While collecting data from air pollution sensor recorders, we encountered anomalous readings that were either significantly lower or higher than expected. This could be due to temporary equipment malfunctions or sensor contamination. Therefore, in addition to removing empty rows from the dataset, we must process rows containing outlier data.</p>
                <p>Outliers are data points that differ significantly from other observations. They can significantly affect the performance of the quadratic model and distort its results, making it essential to detect and handle them properly (
                    <xref ref-type="bibr" rid="ref26">Yerlikaya-&#x00d6;zkurt et al., 2016</xref>).</p>
                <p>Various methods have been proposed to detect outliers, such as nonparametric approaches and robust regression techniques (
                    <xref ref-type="bibr" rid="ref23">Fan et al., 2006</xref>; 
                    <xref ref-type="bibr" rid="ref24">Toshiaki et al., 2021</xref>). These methods aim to identify and remove outliers effectively to ensure the robustness of the analysis. Outlier detection often involves comparing the local density of data points to that of their neighbors, highlighting the importance of considering the context of neighboring points (
                    <xref ref-type="bibr" rid="ref25">Latecki et al., 2007</xref>).</p>
                <p>Our study will examine two main methods to detect outliers: statistical and data normalization or scaling. Normalization or scaling ensures that different features contribute equally to the analysis, which is crucial when features have varying units or scales.
                    <list list-type="alpha-lower">
                        <list-item>
                            <label>a.</label>
                            <p>Z-score method</p>
                            <p>The Z-score method is a commonly used statistical technique for identifying outliers in data by measuring how many standard deviations a data point is from the mean. Data points with Z-scores greater than 3 or less than -3 are typically considered outliers (
                                <xref ref-type="bibr" rid="ref27">Yaro et al., 2024</xref>). To enhance the Z-score method, a modified Z-score based on the median can be utilized to improve robustness, especially when dealing with data values that significantly differ from the mean (
                                <xref ref-type="bibr" rid="ref28">&#x00c7;ILGIN et al., 2023</xref>). This modification helps mitigate the sensitivity of traditional Z-scores to extreme data values. Despite the fact that this method has a preference over more recent techniques due to its simplicity and reliability, it is essential to recognize that the Z-score method may be vulnerable to masking effects, where the presence of outliers can distort the sample mean and variance, potentially concealing other outliers within the data. Therefore, while the Z-score method holds significant value, it is imperative to be aware of its limitations and to consider employing supplementary techniques for a more comprehensive outlier detection strategy. The Python-formatted version of the code snippet for this technique is similar to:

                                <preformat orientation="portrait" position="float" preformat-type="computer code" xml:space="preserve">
                                    <monospace># Z-Score Method</monospace>

                                    <monospace>z_scores = stats.zscore(data['column_name'])</monospace>

                                    <monospace>abs_z_scores = np.abs(z_scores)</monospace>

                                    <monospace>filtered_entries = (abs_z_scores &lt; 3)</monospace>

                                    <monospace>data_cleaned = data [filtered_entries]</monospace>
                                </preformat>
</p>
                        </list-item>
                        <list-item>
                            <label>b.</label>
                            <p>The Interquartile Range (IQR)</p>
                            <p>The Interquartile Range (IQR) method is a statistical technique used to detect outliers in a dataset. It involves calculating the IQR, which is the difference between the 75th percentile (Q3) and the 25th percentile (Q1) of the data. Data points that fall outside the range from Q1 - 1.5 * IQR to Q3 + 1.5 * IQR are considered outliers. This is a common rule of thumb known as the 1.5 IQR rule, which is widely used in various fields such as data science, environmental monitoring, and outlier detection in different applications. For example, in the assessment of ICESat-2 laser altimeter data for water-level measurement, the IQR method was applied to detect outliers (
                                <xref ref-type="bibr" rid="ref29">Cui et al., 2020</xref>). The Python-formatted version of the code snippet for this technique is similar to:

                                <preformat orientation="portrait" position="float" preformat-type="computer code" xml:space="preserve">
                                    <monospace># The Interquartile Range (IQR)</monospace>

                                    <monospace>Q1 = data['column_name'].quantile(0.25)</monospace>

                                    <monospace>Q3 = data['column_name'].quantile(0.75)</monospace>

                                    <monospace>IQR = Q3 - Q1</monospace>

                                    <monospace>filter = (data['column_name'] &gt;= Q1-1.5 * IQR) &amp; (data['column_name'] &lt;= Q3 + 1.5 * IQR)</monospace>

                                    <monospace>data_cleaned = data.loc [filter]</monospace>
                                </preformat>
</p>
                        </list-item>
                    </list>
                </p>
                <p>
                    <list list-type="alpha-lower">
                        <list-item>
                            <label>c.</label>
                            <p>Min-max scaling</p>
                            <p>Min-max scaling, also known as min-max normalization, is a data normalization technique that transforms features so that they fall within a specific range, typically between 0 and 1 (
                                <xref ref-type="bibr" rid="ref30">Ampomah et al., 2021</xref>). This method entails rescaling data to ensure it lies within the interval of zero to one, facilitating a standardized comparison of values both before and subsequent to processing. Min-max normalization is particularly critical in data preprocessing as it preserves the relationships among the original data points while ensuring they reside within a consistent range. The min-max normalization technique effectively scales the data to conform to these specified boundaries by determining the new minimum and maximum values. Researchers have highlighted the significance of min-max normalization in various fields, such as machine learning, where it is considered one of the most common tools for data normalization (
                                <xref ref-type="bibr" rid="ref31">Gertz et al., 2019</xref>). The Python-formatted version of the code snippet for this technique is similar to:

                                <preformat orientation="portrait" position="float" preformat-type="computer code" xml:space="preserve">
                                    <monospace># Min-Max Scaling</monospace>

                                    <monospace>scaler = MinMaxScaler()</monospace>

                                    <monospace>data_scaled = scaler.fit_transform(data)</monospace>
                                </preformat>
</p>
                        </list-item>
                    </list>
                </p>
                <p>
                    <list list-type="alpha-lower">
                        <list-item>
                            <label>d.</label>
                            <p>Standardization</p>
                            <p>Standardization, a common normalization technique, involves centering data around the mean and scaling it to have a unit standard deviation. This process is widely used in various fields. For instance, in image analysis, normalizing input data with mini-batch statistics enforces elements in feature maps to have a zero mean and unit standard deviation (
                                <xref ref-type="bibr" rid="ref32">Wu et al., 2020</xref>). The Python-formatted version of the code snippet for this technique is similar to:

                                <preformat orientation="portrait" position="float" preformat-type="computer code" xml:space="preserve">
                                    <monospace># Standardization</monospace>

                                    <monospace>scaler = StandardScaler()</monospace>

                                    <monospace>data_standardized = scaler.fit_transform(data)</monospace>
                                </preformat>
</p>
                        </list-item>
                    </list>
                </p>
            </sec>
            <sec id="sec5">
                <title>2.3 Fitting the quadratic model</title>
                <p>In Python, this was achieved using the 
                    <monospace>'Polynomial.fit'</monospace> method from the NumPy library, which computes the least-squares fit of a polynomial of specified degree to the given data. The snippet calculates the optimal values for coefficients 
                    <inline-formula>
                        <mml:math display="inline">
                            <mml:mrow>
                                <mml:mo stretchy="true">(</mml:mo>
                                <mml:mi>a</mml:mi>
                                <mml:mo stretchy="true">)</mml:mo>
                            </mml:mrow>
                            <mml:mo>,</mml:mo>
                            <mml:mrow>
                                <mml:mo stretchy="true">(</mml:mo>
                                <mml:mi>b</mml:mi>
                                <mml:mo stretchy="true">)</mml:mo>
                            </mml:mrow>
                            <mml:mo>,</mml:mo>
                            <mml:mrow>
                                <mml:mo stretchy="true">(</mml:mo>
                                <mml:mi>c</mml:mi>
                                <mml:mo stretchy="true">)</mml:mo>
                            </mml:mrow>
                        </mml:math>
                    </inline-formula> that minimize the sum of the squared differences between the observed values and values predicted by the polynomial, thereby effectively &#x201c;fitting&#x201d; the curve to the data. The Python-formatted version of the code snippet is similar to:

                    <preformat orientation="portrait" position="float" preformat-type="computer code" xml:space="preserve">
                        <styled-content style="color:#999988">
                            <italic toggle="yes">
                                <monospace># Fit the quadratic polynomial</monospace>
                            </italic>
                        </styled-content>
                        <monospace>coefs = Polynomial.fit(months, values, 
                            <styled-content style="color:#008080">2</styled-content>).convert().coef</monospace>
                    </preformat>
</p>
                <p>With the fitted polynomial, our script generates a curve across a continuum of points within the data range, which is visualized using Matplotlib&#x2019;s plotting function. The Python-formatted version of the code snippet is similar to:

                    <preformat orientation="portrait" position="float" preformat-type="computer code" xml:space="preserve">
                        <styled-content style="color:#999988">
                            <italic toggle="yes">
                                <monospace># Generate a smooth curve by evaluating the polynomial at many points</monospace>
                            </italic>
                        </styled-content>
                        <monospace>x = np.linspace(months.min(), months.max(), 
                            <styled-content style="color:#008080">200</styled-content>)</monospace>

                        <monospace>y = coefs[
                            <styled-content style="color:#008080">0</styled-content>] + coefs[
                            <styled-content style="color:#008080">1</styled-content>] * x + coefs[
                            <styled-content style="color:#008080">2</styled-content>] * x**
                            <styled-content style="color:#008080">2</styled-content>
                        </monospace>


                        <italic toggle="yes">
                            <monospace>
                                <styled-content style="color:#999988"># Plot the data and the fitted curve</styled-content>
                            </monospace>
                        </italic>
                        <monospace>plt.plot(x, y, color=
                            <styled-content style="color:#DD1144">'purple'</styled-content>, label=
                            <styled-content style="color:#DD1144">'Fitted curve'</styled-content>)</monospace>
                    </preformat>
</p>
                <p>The coefficient of determination, 
                    <inline-formula>
                        <mml:math display="inline">
                            <mml:msup>
                                <mml:mi>R</mml:mi>
                                <mml:mn>2</mml:mn>
                            </mml:msup>
                        </mml:math>
                    </inline-formula>, was subsequently computed to assess the fit quality. Python was used to compare the variance of the residuals (the differences between the observed and predicted values) with the total variance of the data, and the corresponding code snippet is similar to:

                    <preformat orientation="portrait" position="float" preformat-type="computer code" xml:space="preserve">
                        <italic toggle="yes">
                            <monospace>
                                <styled-content style="color:#999988"># Calculate R-squared value</styled-content>
                            </monospace>
                        </italic>


                        <monospace># Predicted values from the polynomial</monospace>

                        <monospace>y_pred = coefs[0] + coefs[1] * months + coefs[2] * months**2</monospace>


                        <monospace># Residuals</monospace>

                        <monospace>residuals = values - y_pred</monospace>


                        <monospace># Sum of squares of residuals</monospace>

                        <monospace>ss_res = np.sum (residuals**2)</monospace>


                        <monospace># Total sum of squares</monospace>

                        <monospace>ss_tot = np.sum((values - np.mean (values))**2)</monospace>


                        <monospace># R-squared</monospace>

                        <monospace>r_squared = 1 - (ss_res/ss_tot)</monospace>
                    </preformat>
</p>
                <p>An 
                    <inline-formula>
                        <mml:math display="inline">
                            <mml:mrow>
                                <mml:mo stretchy="true">(</mml:mo>
                                <mml:msup>
                                    <mml:mi>R</mml:mi>
                                    <mml:mn>2</mml:mn>
                                </mml:msup>
                                <mml:mo stretchy="true">)</mml:mo>
                            </mml:mrow>
                        </mml:math>
                    </inline-formula> value close to one (1) suggests that the model explains a large portion of the variance in the response variable, indicating a strong fit. Conversely, a value near zero (0) suggests the model does not explain the variance well.</p>
            </sec>
            <sec id="sec6">
                <title>2.4 Implementation</title>
                <p>This section details the implementation of quadratic polynomial models in Python that are used in various applications, as demonstrated in this study. The core of the implementation involved the use of Python NumPy and Matplotlib libraries for mathematical operations and visualizations. The polynomial model is defined by the equation 
                    <inline-formula>
                        <mml:math display="inline">
                            <mml:msup>
                                <mml:mrow>
                                    <mml:mi>a</mml:mi>
                                    <mml:mi>x</mml:mi>
                                </mml:mrow>
                                <mml:mn>2</mml:mn>
                            </mml:msup>
                            <mml:mo>+</mml:mo>
                            <mml:mi mathvariant="italic">bx</mml:mi>
                            <mml:mo>+</mml:mo>
                            <mml:mi>c</mml:mi>
                        </mml:math>
                    </inline-formula>, where 
                    <inline-formula>
                        <mml:math display="inline">
                            <mml:mrow>
                                <mml:mo stretchy="true">(</mml:mo>
                                <mml:mi>a</mml:mi>
                                <mml:mo stretchy="true">)</mml:mo>
                            </mml:mrow>
                            <mml:mo>,</mml:mo>
                            <mml:mrow>
                                <mml:mo stretchy="true">(</mml:mo>
                                <mml:mi>b</mml:mi>
                                <mml:mo stretchy="true">)</mml:mo>
                            </mml:mrow>
                            <mml:mo>,</mml:mo>
                            <mml:mrow>
                                <mml:mo stretchy="true">(</mml:mo>
                                <mml:mi>c</mml:mi>
                                <mml:mo stretchy="true">)</mml:mo>
                            </mml:mrow>
                        </mml:math>
                    </inline-formula>, are the coefficients optimized to fit the data points collected in different studies. The fitting process utilizes the 
                    <monospace>'Polynomial.fit'</monospace> method, which employs a least-squares polynomial fit. To ensure robustness and accuracy, the implementation also included calculation of the coefficient of determination 
                    <inline-formula>
                        <mml:math display="inline">
                            <mml:mrow>
                                <mml:mo stretchy="true">(</mml:mo>
                                <mml:msup>
                                    <mml:mi>R</mml:mi>
                                    <mml:mn>2</mml:mn>
                                </mml:msup>
                                <mml:mo stretchy="true">)</mml:mo>
                            </mml:mrow>
                        </mml:math>
                    </inline-formula> from the residual and total sums of squares using NumPy&#x2019;s sum and mean functions. This metric helps to assess the polynomial fit to the data, which is essential for the applications discussed, ranging from trend analysis in software usage to predicting the material properties of nanocomposites.</p>
                <p>In the next step, we used Python to present an applied exploration of quadratic polynomial fitting and the coefficient of determination (R-squared) within the context of data analysis.</p>
                <p>The following Python script is a practical implementation tool for researchers and analysts. It begins by prompting the user to describe the dataset, for example a location or a specific environmental metric such as the PM2.5 air pollution index. This interactivity ensures that the resulting visualization is tailored and informative. The Python-formatted version of the code snippet of this part of our script is similar to:

                    <preformat orientation="portrait" position="float" preformat-type="computer code" xml:space="preserve">
                        <italic toggle="yes">
                            <monospace>
                                <styled-content style="color:#999988"># User inputs for the descriptive elements of the plot</styled-content>
                            </monospace>
                        </italic>
                        <monospace>description = input(
                            <styled-content style="color:#DD1144">"Enter the location description (e.g., Kyiv, Shcherbakovskaya St.):"</styled-content>)</monospace>

                        <monospace>pollution_name = input(
                            <styled-content style="color:#DD1144">"Enter the pollution name (e.g., PM2.5):"</styled-content>)</monospace>

                        <monospace>y_label = input(
                            <styled-content style="color:#DD1144">"Enter the y-axis label (e.g., PM2.5 Index):"</styled-content>)</monospace>
                    </preformat>
</p>
                <p>The script reads data from a CSV file using Pandas, a library that excels in data manipulation. The data consists of monthly observations of the chosen metric. You can see this implementation in the Python-formatted version of the code snippet similar to:

                    <preformat orientation="portrait" position="float" preformat-type="computer code" xml:space="preserve">
                        <italic toggle="yes">
                            <monospace>
                                <styled-content style="color:#999988"># Read data from a CSV file</styled-content>
                            </monospace>
                        </italic>
                        <italic toggle="yes">
                            <monospace>
                                <styled-content style="color:#999988"># Use the direct link to the raw CSV file from the GitHub repository</styled-content>
                            </monospace>
                        </italic>
                        <monospace>data = pd.read_csv(
                            <styled-content style="color:#DD1144">'</styled-content>
                            <ext-link ext-link-type="uri" xlink:href="https://raw.githubusercontent.com/rsipakov/QuadraticPolynomialsPyDA/main/notebooks/pm_data.csv">
                                <styled-content style="color:#DD1144">https://raw.githubusercontent.com/rsipakov/QuadraticPolynomialsPyDA/main/notebooks/pm_data.csv</styled-content>
                            </ext-link>
                            <styled-content style="color:#DD1144">'</styled-content>)</monospace>
                        <italic toggle="yes">
                            <monospace>
                                <styled-content style="color:#999988"># Or downloading CSV file to the local</styled-content>
                            </monospace>
                        </italic>
                        <italic toggle="yes">
                            <monospace>
                                <styled-content style="color:#999988"># data = pd.read_csv('/path/pm_data.csv') # Update the path to your CSV file</styled-content>
                            </monospace>
                        </italic>
                        <monospace>months = data[
                            <styled-content style="color:#DD1144">'Month'</styled-content>].to_numpy()</monospace>

                        <monospace>values = data[
                            <styled-content style="color:#DD1144">'Values'</styled-content>].to_numpy()</monospace>
                    </preformat>
</p>
                <p>As described above, with the data in hand, the NumPy library&#x2019;s 
                    <monospace>'Polynomial.fit'</monospace> function is employed to fit a quadratic polynomial to these observations. This is an essential step in modeling nonlinear behavior, accommodating potential fluctuations in data that a simple linear model would miss. Subsequently, the script computes the fitted values and leverages them to calculate the R-squared values. This statistic conveys the proportion of variance in the dependent variable explained by the independent variable. The Matplotlib library was then used to graphically represent the data along with the fitted curve, visually comparing the actual data points with those of the predictive model.</p>
                <p>The following sources (
                    <xref ref-type="bibr" rid="ref9">VanderPlas, 2016</xref>; 
                    <xref ref-type="bibr" rid="ref10">McKinney, 2017</xref>) provide a comprehensive overview of Python&#x2019;s theoretical background and practical application. These resources offer a deep dive into data analysis using Python, including comprehensive guidance on regression analysis, and robust examples that bridge theory with practice.</p>
            </sec>
            <sec id="sec7">
                <title>2.5 R-squared limitations</title>
                <p>R-squared is a commonly used metric for assessing the goodness of fit of regression models. However, it has notable limitations that must be taken into account when evaluating model performance. One key limitation is its sensitivity to the number of predictors in the model. As more predictors are added, R-squared will invariably increase, even if these additional predictors are not truly relevant to the model. This phenomenon can lead to overfitting, where the model captures noise rather than the actual relationship in the data (
                    <xref ref-type="bibr" rid="ref33">Fox &amp; Weisberg, 2018</xref>).</p>
                <p>To enhance the evaluation of regression models and address limitations such as overfitting, researchers can utilize a combination of metrics beyond the traditional R-squared. Adjusted R-squared is recommended as it considers the number of predictors in the model, offering a more balanced assessment that considers model complexity and penalizes the inclusion of irrelevant predictors (
                    <xref ref-type="bibr" rid="ref34">Ajjaj et al., 2022</xref>). This adjustment helps prevent overfitting, ensuring that the model captures the underlying data patterns effectively. Additionally, Mean Squared Error (MSE) and Root Mean Squared Error (RMSE) are valuable metrics for assessing prediction accuracy by quantifying the average squared differences between observed and predicted values (
                    <xref ref-type="bibr" rid="ref35">Chicco et al., 2021</xref>). These metrics are particularly useful for comparing different models and providing an intuitive measure of prediction error.</p>
                <p>To implement additional metrics like Adjusted R-squared, Mean Squared Error (MSE), and Root Mean Squared Error (RMSE) in our code, we provide below the Python-formatted version of the code snippet, similar to:

                    <preformat orientation="portrait" position="float" preformat-type="computer code" xml:space="preserve">
                        <monospace># Calculate Adjusted R-squared value</monospace>

                        <monospace>n = len (values_scaled) # number of data points</monospace>

                        <monospace>p = 2 # number of predictors (polynomial degree)</monospace>

                        <monospace>adjusted_r_squared = 1 - ((1 - r_squared) * (n - 1) / (n - p - 1))</monospace>


                        <monospace># Calculate Mean Squared Error (MSE) and Root Mean Squared Error (RMSE)</monospace>

                        <monospace>mse = mean_squared_error(values_scaled, fitted_y_values)</monospace>

                        <monospace>rmse = np.sqrt (mse)</monospace>
                    </preformat>
</p>
            </sec>
            <sec id="sec8">
                <title>2.6 Operation</title>
                <p>The software tool based on quadratic polynomial models requires the following system setup and workflow: operating system&#x2014;Windows, macOS, or Linux; Python version&#x2014;Python 3.6 or later; dependencies&#x2014;NumPy, Matplotlib, Pandas, and scikit-learn (the latest versions are recommended); memory&#x2014;at least 4 GB of RAM; processor&#x2014;1 GHz or faster. The software is accessible through MyBinder.org, requires no local installation, and is fully configured to run in any web browser, ensuring its ease of use and reproducibility.</p>
            </sec>
            <sec id="sec9">
                <title>2.7 Installation process</title>
                <p>To begin the installation process, it is imperative to ensure that Python is installed in the operating system. If Python is not present, it can be acquired from Python&#x2019;s official website, python.org. After successful installation of Python, the next step is to install the necessary libraries. This can be achieved through the Python Package Index (PyPI) using the pip installer. Execute the following command in the command prompt or terminal to install the required libraries: 
                    <monospace>'pip install numpy pandas matplotlib scikit-learn'</monospace>. This command installs NumPy, which is essential for numerical computations; Matplotlib, a library for plotting graphs and effectively visualizing the data; Pandas, a data manipulation and analysis library; and scikit-learn, a widely used machine-learning library.</p>
                <p>After developing the script using the quadratic polynomial models described above, the complete Python code was hosted on GitHub (
                    <xref ref-type="bibr" rid="ref11">Sipakov, 2024</xref>), enabling replication and further exploration of the findings. To facilitate ease of use and accessibility, the code was made available through 
                    <ext-link ext-link-type="uri" xlink:href="https://mybinder.org">MyBinder.org</ext-link> (
                    <ext-link ext-link-type="uri" xlink:href="https://mybinder.org/v2/gh/rsipakov/QuadraticPolynomialsPyDA/main">https://mybinder.org/v2/gh/rsipakov/QuadraticPolynomialsPyDA/main</ext-link>), allowing it to operate in a live environment without the need for local setup. This implementation ensures that other researchers can directly interact with the codebase, providing a dynamic way to validate and extend research findings.</p>
            </sec>
        </sec>
        <sec id="sec10" sec-type="results">
            <title>3. Results</title>
            <p>The quadratic polynomial fitting method used in this study demonstrates Python's ability to effectively manage and analyze complex datasets. The datasets used herein are illustratively generated, serving as a basis for demonstrating the potential applications of quadratic polynomial models. The fitting process provided a smooth curve aligned closely with the observed data points, indicating robust model performance. Notably, the computed coefficient of determination, R-squared 
                <inline-formula>
                    <mml:math display="inline">
                        <mml:mrow>
                            <mml:mo stretchy="true">(</mml:mo>
                            <mml:msup>
                                <mml:mi>R</mml:mi>
                                <mml:mn>2</mml:mn>
                            </mml:msup>
                            <mml:mo stretchy="true">)</mml:mo>
                        </mml:mrow>
                        <mml:mo>,</mml:mo>
                    </mml:math>
                </inline-formula> was substantially high, reflecting a strong correlation between the observed values and those predicted by the model. This statistical measure underpins the polynomial's ability to capture and explain variability in the data effectively, which is crucial for validating the regression model used in this analysis. 
                <xref ref-type="fig" rid="f2">Figure 2</xref> illustrates the quadratic polynomial curve fitted to the observed data points using Python's plotting library Matplotlib.</p>
            <fig fig-type="figure" id="f2" orientation="portrait" position="float">
                <label>Figure 2. </label>
                <caption>
                    <title>Quadratic polynomial fit of dataset.</title>
                </caption>
                <graphic id="gr2" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/169942/7b98933b-927e-4eb2-b174-a59720c471f8_figure2.gif"/>
            </fig>
            <p>The curve represents the model obtained from regression analysis, where the quadratic polynomial provides a significant fit to the data, as evidenced by the computed R-squared value. The axes were labeled to identify the independent variable (x-axis) and dependent variable (y-axis), and a legend was included to differentiate between the observed data points and fitted polynomial curve. The smoothness of the curve indicates the effectiveness of the model in capturing trends within the dataset, which can be utilized for predictive analytics and further statistical inferences. After configuring the plot with the necessary parameters for clear and informative visualization, it was generated using the 
                <monospace>'plt.show()'</monospace> function in Matplotlib.</p>
            <p>To provide a broader perspective on quadratic models' performance, we compared them with linear and cubic models using the same datasets; the results are shown in 
                <xref ref-type="fig" rid="f3">Figure 3</xref>. This comparison utilized three key metrics: R-squared, Adjusted R-squared, and Mean Squared Error (MSE) to assess the fit and predictive accuracy. We used Python to fit linear, quadratic, and cubic models to the datasets and calculate the aforementioned metrics. The results of the model fitting are summarized in 
                <xref ref-type="table" rid="T1">Table 1</xref>.</p>
            <fig fig-type="figure" id="f3" orientation="portrait" position="float">
                <label>Figure 3. </label>
                <caption>
                    <title>Quadratic polynomial fit of dataset.</title>
                    <p>Comparing quadratic, linear and cubic models using the same datasets.</p>
                </caption>
                <graphic id="gr3" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/169942/7b98933b-927e-4eb2-b174-a59720c471f8_figure3.gif"/>
            </fig>
            <table-wrap id="T1" orientation="portrait" position="float">
                <label>Table 1. </label>
                <caption>
                    <title>Comparing quadratic, linear and cubic models using the same datasets.</title>
                </caption>
                <table content-type="article-table" frame="hsides">
                    <thead>
                        <tr>
                            <th align="left" colspan="1" rowspan="1" valign="top">Model</th>
                            <th align="left" colspan="1" rowspan="1" valign="top">R-squared</th>
                            <th align="left" colspan="1" rowspan="1" valign="top">Adjusted R-squared</th>
                            <th align="left" colspan="1" rowspan="1" valign="top">MSE</th>
                        </tr>
                    </thead>
                    <tbody>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">Linear</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">0.0173</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">-0.0810</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">0.9827</td>
                        </tr>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">Quadratic</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">0.7805</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">0.7318</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">0.2195</td>
                        </tr>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">Cubic</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">0.8737</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">0.8263</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">0.1263</td>
                        </tr>
                    </tbody>
                </table>
            </table-wrap>
            <p>The linear model shows a very poor fit with an R-squared value of 0.0173, indicating that it barely explains the variance in the data. The negative Adjusted R-squared suggests that the model is not suitable for this dataset. The quadratic model significantly improves the fit, with an R-squared value of 0.7805 and an Adjusted R-squared of 0.7318, indicating a much better fit compared to the linear model. The MSE is also substantially lower. The cubic model provides the best fit among the three, with the highest R-squared value of 0.8737 and Adjusted R-squared of 0.8263, along with the lowest MSE, indicating that it explains the variance in the data the most effectively.</p>
            <p>The selection between quadratic and cubic models should account for the intricacy of the dataset and the potential for overfitting. The quadratic model often strikes an optimal balance between simplicity and precision, making it preferable for numerous practical applications. The quadratic model's ability to effectively capture the essential patterns in the data without the risk of overfitting associated with higher-degree polynomials underscores its utility and robustness in empirical research and applied data analysis.</p>
        </sec>
        <sec id="sec11" sec-type="discussion">
            <title>4. Discussion</title>
            <p>Quadratic polynomials are valued for their ability to model nonlinear relationships in various data contexts, balancing computational efficiency and interpretability. However, their performance can be limited when confronted with complex multivariable systems in which more sophisticated statistical models may be more accurate. Future research could address these challenges by focusing on several advancements in quadratic polynomial modeling. Incorporating regularization techniques is recommended to counteract overfitting, particularly for datasets with intricate structures. Exploring hybrid models that merge the clear interpretive benefits of quadratic polynomials with the robust capabilities of machine learning algorithms could also enhance predictive accuracy.</p>
            <p>Moreover, the development of adaptive polynomial models that adjust their parameters based on real-time data inputs can significantly improve dynamic data analysis. Extending these models to operate within multiscale frameworks may offer deeper insights into various levels of data structure, ensuring a comprehensive understanding of complex patterns. These enhancements are crucial for extending the utility of quadratic polynomials beyond their current capabilities and facilitating more accurate and efficient statistical analyses across diverse datasets.</p>
            <p>This study acknowledges that the effectiveness of quadratic polynomials, like any statistical model, is contingent on the quality and volume of the data available. To mitigate potential biases and inaccuracies in the input data, the data collection methodology should include rigorous data preprocessing steps, such as outlier removal, normalization, and feature selection, which are crucial for enhancing the reliability of the research. Despite the potential of more advanced models, this study primarily advocates quadratic polynomials because of their suitability for datasets exhibiting quadratic relationships, which are frequently encountered in environment-related research. However, future research should continue to explore the comparative dynamic performance of quadratic polynomials, for example, by benchmarking them against contemporary machine-learning algorithms to ensure a comprehensive understanding of their relative merits, possibly extending to hybrid approaches that combine the strengths of traditional polynomial models and cutting-edge machine-learning techniques.</p>
            <p>While quadratic models offer simplicity and clarity, they may not capture the complexity of data as effectively as some machine-learning models. However, their computational efficiency and suitability for smaller datasets can be advantageous for specific scenarios.</p>
            <p>
                <bold>Challenges and limitations of quadratic polynomials</bold>
            </p>
            <p>Quadratic polynomials can effectively model nonlinear relationships, but they are prone to overfitting, particularly with small or noisy datasets. Overfitting occurs when the model becomes too complex and captures the noise in the data rather than the underlying trend. This results in poor generalization to new data.</p>
            <p>When the dataset is small, the quadratic model might fit the few available data points too closely, capturing random variations rather than the actual trend. In datasets with a high level of noise, a quadratic polynomial might try to model these fluctuations, leading to overfitting.</p>
            <p>Techniques such as Ridge Regression (L2 regularization) or Lasso Regression (L1 regularization) can penalize the complexity of the model, discouraging overfitting. Using cross-validation methods, such as k-fold cross-validation, helps in assessing the model's performance on different subsets of the data, ensuring it generalizes well to unseen data. Sometimes, a linear model might suffice if the relationship is not strongly nonlinear. Alternatively, we can consider higher-order polynomials only if there is a clear justification from the data.</p>
            <p>Quadratic models are sensitive to variability in the data, which can significantly affect their performance. Small changes in the data can lead to substantial changes in the fitted model, impacting its stability and predictive power. Properly preprocessing the data by removing outliers and handling missing values can improve model stability. Implementing robust statistical techniques to detect and handle anomalies can mitigate the sensitivity of the model to data variability. Combining multiple models (e.g., through bagging or boosting) can reduce the impact of variability and enhance predictive performance.</p>
            <p>
                <bold>When regularization and cross-validation are needed</bold>
            </p>
            <p>Unfortunately, 
                <monospace>'Polynomial.fit'</monospace> itself does not support regularization directly, so we need to mimic regularization and cross-validation manually. However, the use of 
                <monospace>'Polynomial.fit'</monospace> from the NumPy library for fitting a polynomial to data has its advantages, particularly for straightforward polynomial regression without the need for additional regularization or cross-validation. The syntax is simple and easy to understand, making the code more readable. 
                <monospace>'Polynomial.fit'</monospace> directly provides the coefficients of the fitted polynomial, which can be easily accessed and interpreted. For small to moderate-sized datasets, 
                <monospace>'Polynomial.fit'</monospace> is computationally efficient. It uses least-squares fitting, which is optimal for such scenarios without the overhead of more complex methods. This can be particularly useful when the primary goal is to quickly fit and visualize a polynomial model.</p>
            <p>While 
                <monospace>'Polynomial.fit'</monospace> has these advantages, there are situations where more complex techniques like regularization and cross-validation become necessary. 
                <monospace>'Polynomial.fit'</monospace> is excellent for simplicity, quick fitting, and visualization. Ridge regression with cross-validation offers more robust performance evaluation and overfitting prevention for complex scenarios.</p>
        </sec>
        <sec id="sec12" sec-type="conclusion">
            <title>5. Conclusion</title>
            <p>In this study, we demonstrate the practical utility and versatility of quadratic polynomials for advanced data analysis in Python. We showcase how quadratic models can effectively capture nonlinear relationships in complex datasets by leveraging the capabilities of Python libraries such as NumPy, Matplotlib, scikit-learn, and Pandas.</p>
            <p>The results highlight the strong performance of the quadratic polynomial fit, as evidenced by the high coefficient of determination (R-squared) value. This indicates that the model explains a substantial proportion of the variability in the data. Comparisons with linear and cubic models further underscore the quadratic model's ability to strike an optimal balance between simplicity and precision for many practical applications.</p>
            <p>However, our study also acknowledges quadratic polynomials' limitations, such as their susceptibility to overfitting with small or noisy datasets and their sensitivity to data variability. Techniques like regularization and cross-validation are recommended to mitigate these challenges and ensure robust model performance.</p>
            <p>Future research directions are proposed, including the incorporation of regularization methods, exploration of hybrid models combining quadratic polynomials with machine learning algorithms, development of adaptive polynomial models, and extension to multiscale frameworks. These advancements can further enhance the accuracy and efficiency of quadratic polynomial models for diverse data analysis tasks.</p>
        </sec>
        <sec id="sec13">
            <title>Ethical compliance</title>
            <p>All procedures involving human participants were performed in accordance with the ethical standards of the Institutional and National Research Committee.</p>
        </sec>
        <sec id="sec14">
            <title>Author contributions</title>
            <p>Rostyslav Sipakov contributed to the research design, implementation, and manuscript writing. Dr. Voloshkina and Dr. Kovalova helped implement and analyze the results. All authors have seen and agreed to the final content of the manuscript.</p>
        </sec>
    </body>
    <back>
        <sec id="sec15" sec-type="data-availability">
            <title>Data availability statement</title>
            <p>No data is associated with this article.</p>
        </sec>
        <sec id="sec16">
            <title>Software availability statement</title>
            <p>

                <list list-type="bullet">
                    <list-item>
                        <label>&#x2022;</label>
                        <p>Source code of the scripts available from: 
                            <ext-link ext-link-type="uri" xlink:href="https://github.com/rsipakov/QuadraticPolynomialsPyDA">https://github.com/rsipakov/QuadraticPolynomialsPyDA</ext-link>
                        </p>
                    </list-item>
                    <list-item>
                        <label>&#x2022;</label>
                        <p>Archived scripts available from: 
                            <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.5281/zenodo.10637508">https://doi.org/10.5281/zenodo.10637508</ext-link>
                        </p>
                    </list-item>
                    <list-item>
                        <label>&#x2022;</label>
                        <p>License: OSI approved open license software is under MIT License (
                            <ext-link ext-link-type="uri" xlink:href="https://opensource.org/license/MIT">https://opensource.org/license/MIT</ext-link>)</p>
                    </list-item>
                </list>
            </p>
        </sec>
        <ref-list>
            <title>References</title>
            <ref id="ref34">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Ajjaj</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Houssaini</surname>
                            <given-names>SE</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Hain</surname>
                            <given-names>M</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Performance assessment and modeling of routing protocol in vehicular ad hoc networks using statistical design of experiments methodology: a comprehensive study.</article-title>
                    <source>

                        <italic toggle="yes">Appl. Syst. Innov.</italic>
</source>
                    <year>2022</year>;<volume>5</volume>(<issue>1</issue>):<fpage>19</fpage>.
                    <pub-id pub-id-type="doi">10.3390/asi5010019</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref4">
                <mixed-citation publication-type="other">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Aladesanmi</surname>
                            <given-names>VI</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Fatoba</surname>
                            <given-names>OS</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Jen</surname>
                            <given-names>TC</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Python Data Analysis and Regression Plots of Wear and Hardness Characteristics of Laser Cladded Ti and TiB2 Nanocomposites on Steel Rail.</article-title>
                    <source>

                        <italic toggle="yes">2021 IEEE 12th International Conference on Mechanical and Intelligent Manufacturing Technologies (ICMIMT).</italic>
</source>
                    <year>2021</year>; pp.<fpage>40</fpage>&#x2013;<lpage>44</lpage>.
                    <pub-id pub-id-type="doi">10.1109/icmimt52186.2021.9476211</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref2">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Alexander</surname>
                            <given-names>WM</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Ficarro</surname>
                            <given-names>SB</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Adelmant</surname>
                            <given-names>G</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>multiplierz v2.0: a Python-based ecosystem for shared access and analysis of native mass spectrometry data.</article-title>
                    <source>

                        <italic toggle="yes">Proteomics.</italic>
</source>
                    <year>2017</year>;<volume>17</volume>(<issue>15-16</issue>):<fpage>1700091</fpage>.
                    <pub-id pub-id-type="pmid">28686798</pub-id>
                    <pub-id pub-id-type="doi">10.1002/pmic.201700091</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref30">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Ampomah</surname>
                            <given-names>EK</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Nyame</surname>
                            <given-names>G</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Qin</surname>
                            <given-names>Z</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Stock market prediction with Gaussian na&#x00ef;ve Bayes machine learning algorithm.</article-title>
                    <source>

                        <italic toggle="yes">Informatica.</italic>
</source>
                    <year>2021</year>;<volume>45</volume>(<issue>2</issue>).
                    <pub-id pub-id-type="doi">10.31449/inf.v45i2.3407</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref13">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Chang</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Huh</surname>
                            <given-names>U</given-names>
                        </name>
</person-group>:
                    <article-title>Curvature-continuous 3D path-planning using QPMI method.</article-title>
                    <source>

                        <italic toggle="yes">Int. J. Adv. Robot. Syst.</italic>
</source>
                    <year>2015</year>;<volume>12</volume>(<issue>6</issue>):<fpage>76</fpage>.
                    <pub-id pub-id-type="doi">10.5772/60718</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref35">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Chicco</surname>
                            <given-names>D</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Warrens</surname>
                            <given-names>MJ</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Jurman</surname>
                            <given-names>G</given-names>
                        </name>
</person-group>:
                    <article-title>The coefficient of determination R-squared is more informative than SMAPE, MAE, MAPE, MSE and RMSE in regression analysis evaluation.</article-title>
                    <source>

                        <italic toggle="yes">PeerJ. Comput. Sci.</italic>
</source>
                    <year>2021</year>;<volume>7</volume>:<fpage>e623</fpage>.
                    <pub-id pub-id-type="pmid">34307865</pub-id>
                    <pub-id pub-id-type="doi">10.7717/peerj-cs.623</pub-id>
                    <pub-id pub-id-type="pmcid">PMC8279135</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref28">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>&#x00c7;&#x0131;lg&#x0131;n</surname>
                            <given-names>C</given-names>
                        </name>

                        <name name-style="western">
                            <surname>G&#x00f6;k&#x015f;en</surname>
                            <given-names>Y</given-names>
                        </name>

                        <name name-style="western">
                            <surname>G&#x00f6;k&#x00e7;en</surname>
                            <given-names>H</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>The effect of outlier detection methods in real estate valuation with machine learning.</article-title>
                    <source>

                        <italic toggle="yes">&#x0130;zmir Sosyal Bilimler Dergisi.</italic>
</source>
                    <year>2023</year>;<volume>5</volume>(<issue>1</issue>):<fpage>9</fpage>&#x2013;<lpage>20</lpage>.
                    <pub-id pub-id-type="doi">10.47899/ijss.1270433</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref29">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Cui</surname>
                            <given-names>Y</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Gong</surname>
                            <given-names>P</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Bai</surname>
                            <given-names>Y</given-names>
                        </name>
</person-group>:
                    <article-title>Performance assessment of ICESat-2 laser altimeter data for water-level measurement over lakes and reservoirs in China.</article-title>
                    <source>

                        <italic toggle="yes">Remote Sensing.</italic>
</source>
                    <year>2020</year>;<volume>12</volume>(<issue>5</issue>):<fpage>770</fpage>.
                    <pub-id pub-id-type="doi">10.3390/rs12050770</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref7">
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Draper</surname>
                            <given-names>NR</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Smith</surname>
                            <given-names>H</given-names>
                        </name>
</person-group>:
                    <source>

                        <italic toggle="yes">Applied Regression Analysis.</italic>
</source>
                    <edition>3rd ed.</edition>
                    <publisher-loc>New York</publisher-loc>:
                    <publisher-name>John Wiley</publisher-name>;<year>2014</year>.
                    <isbn>978-1-118-62568-2</isbn>.
                    <ext-link ext-link-type="uri" xlink:href="https://www.wiley.com/en-us/Applied+Regression+Analysis%2C+3rd+Edition-p-9781118625682">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref21">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Dubey</surname>
                            <given-names>A</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Rasool</surname>
                            <given-names>A</given-names>
                        </name>
</person-group>:
                    <article-title>Efficient technique of microarray missing data imputation using clustering and weighted nearest neighbour.</article-title>
                    <source>

                        <italic toggle="yes">Sci. Rep.</italic>
</source>
                    <year>2021</year>;<volume>11</volume>(<issue>1</issue>):<fpage>24297</fpage>.
                    <pub-id pub-id-type="pmid">34934107</pub-id>
                    <pub-id pub-id-type="doi">10.1038/s41598-021-03438-x</pub-id>
                    <pub-id pub-id-type="pmcid">PMC8692342</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref23">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Fan</surname>
                            <given-names>H</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Za&#x00ef;ane</surname>
                            <given-names>OR</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Foss</surname>
                            <given-names>A</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>A nonparametric outlier detection for effectively discovering top-n outliers from engineering data.</article-title>
                    <source>

                        <italic toggle="yes">Advances in Knowledge Discovery and Data Mining.</italic>
</source>
                    <year>2006</year>;<fpage>557</fpage>&#x2013;<lpage>566</lpage>.
                    <pub-id pub-id-type="doi">10.1007/11731139_66</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref17">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Fleck</surname>
                            <given-names>P</given-names>
                        </name>

                        <name name-style="western">
                            <surname>K&#x00fc;gel</surname>
                            <given-names>M</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Kommenda</surname>
                            <given-names>M</given-names>
                        </name>
</person-group>:
                    <article-title>Understanding and preparing data of industrial processes for machine learning applications.</article-title>
                    <source>

                        <italic toggle="yes">Computer Aided Systems Theory &#x2013; EUROCAST.</italic>
</source>
                    <year>2019</year>;<volume>12013</volume>:<fpage>413</fpage>&#x2013;<lpage>420</lpage>.
                    <pub-id pub-id-type="doi">10.1007/978-3-030-45093-9_50</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref33">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Fox</surname>
                            <given-names>J</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Weisberg</surname>
                            <given-names>S</given-names>
                        </name>
</person-group>:
                    <article-title>Visualizing fit and lack of fit in complex regression models with predictor effect plots and partial residuals.</article-title>
                    <source>

                        <italic toggle="yes">J. Stat. Softw.</italic>
</source>
                    <year>2018</year>;<volume>87</volume>(<issue>9</issue>).
                    <pub-id pub-id-type="doi">10.18637/jss.v087.i09</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref14">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Fuchs</surname>
                            <given-names>E</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Gruber</surname>
                            <given-names>C</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Reitmaier</surname>
                            <given-names>T</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Processing short-term and long-term information with a combination of polynomial approximation techniques and time-delay neural networks.</article-title>
                    <source>

                        <italic toggle="yes">IEEE Trans. Neural Netw.</italic>
</source>
                    <year>2009</year>;<volume>20</volume>(<issue>9</issue>):<fpage>1450</fpage>&#x2013;<lpage>1462</lpage>.
                    <pub-id pub-id-type="pmid">19628457</pub-id>
                    <pub-id pub-id-type="doi">10.1109/tnn.2009.2024679</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref31">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Gertz</surname>
                            <given-names>C</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Gertz</surname>
                            <given-names>A</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Matth&#x00e4;us</surname>
                            <given-names>B</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Willenberg</surname>
                            <given-names>I</given-names>
                        </name>
</person-group>:
                    <article-title>A systematic chemometric approach to identify the geographical origin of olive oils.</article-title>
                    <source>

                        <italic toggle="yes">Eur. J. Lipid Sci. Technol.</italic>
</source>
                    <year>2019</year>;<volume>121</volume>(<issue>12</issue>).
                    <pub-id pub-id-type="doi">10.1002/ejlt.201900281</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref15">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Gibert</surname>
                            <given-names>P</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Mor&#x00e9;teau</surname>
                            <given-names>B</given-names>
                        </name>

                        <name name-style="western">
                            <surname>David</surname>
                            <given-names>JR</given-names>
                        </name>
</person-group>:
                    <article-title>Developmental constraints on an adaptive plasticity: reaction norms of pigmentation in adult segments of Drosophila melanogaster.</article-title>
                    <source>

                        <italic toggle="yes">Evol. Dev.</italic>
</source>
                    <year>2000</year>;<volume>2</volume>(<issue>5</issue>):<fpage>249</fpage>&#x2013;<lpage>260</lpage>.
                    <pub-id pub-id-type="pmid">11252554</pub-id>
                    <pub-id pub-id-type="doi">10.1046/j.1525-142x.2000.00064.x</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref1">
                <mixed-citation publication-type="other">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Gong</surname>
                            <given-names>Y</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Zhang</surname>
                            <given-names>P</given-names>
                        </name>
</person-group>:
                    <article-title>Predictive Analysis and Research Of Python Usage Rate Based on Polynomial Regression Model.</article-title>
                    <source>

                        <italic toggle="yes">2021 3rd International Conference on Artificial Intelligence and Advanced Manufacture (AIAM).</italic>
</source>
                    <year>2021</year>; pp.<fpage>266</fpage>&#x2013;<lpage>270</lpage>.
                    <pub-id pub-id-type="doi">10.1109/aiam54119.2021.00061</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref6">
                <mixed-citation publication-type="other">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Kaliukh</surname>
                            <given-names>I</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Voloshkina</surname>
                            <given-names>O</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Efimenko</surname>
                            <given-names>V</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Modern Technologies of Internet of Things in the Restrained Urban Development for Complicated Ground Conditions.</article-title>
                    <source>

                        <italic toggle="yes">16th International Conference Monitoring of Geological Processes and Ecological Condition of the Environment.</italic>
</source>
                    <year>2022</year>; pp.<fpage>1</fpage>&#x2013;<lpage>5</lpage>.
                    <pub-id pub-id-type="doi">10.3997/2214-4609.2022580086</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref19">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Karrar</surname>
                            <given-names>AE</given-names>
                        </name>
</person-group>:
                    <article-title>The effect of using data pre-processing by imputations in handling missing values.</article-title>
                    <source>

                        <italic toggle="yes">Indonesian Journal of Electrical Engineering and Informatics (IJEEI).</italic>
</source>
                    <year>2022</year>;<volume>10</volume>(<issue>2</issue>).
                    <pub-id pub-id-type="doi">10.52549/ijeei.v10i2.3730</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref12">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Koivisto</surname>
                            <given-names>TS</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Hohmann</surname>
                            <given-names>M</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Z&#x0142;o&#x015b;nik</surname>
                            <given-names>T</given-names>
                        </name>
</person-group>:
                    <article-title>The general linear Cartan khronon.</article-title>
                    <source>

                        <italic toggle="yes">Universe.</italic>
</source>
                    <year>2019</year>;<volume>5</volume>(<issue>7</issue>):<fpage>168</fpage>.
                    <pub-id pub-id-type="doi">10.3390/universe5070168</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref25">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Latecki</surname>
                            <given-names>LJ</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Lazarevi&#x0107;</surname>
                            <given-names>A</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Pokrajac</surname>
                            <given-names>D</given-names>
                        </name>
</person-group>:
                    <article-title>Outlier detection with kernel density functions.</article-title>
                    <source>

                        <italic toggle="yes">Machine Learning and Data Mining in Pattern Recognition.</italic>
</source>
                    <year>2007</year>;<fpage>61</fpage>&#x2013;<lpage>75</lpage>.
                    <pub-id pub-id-type="doi">10.1007/978-3-540-73499-4_6</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref20">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Liu</surname>
                            <given-names>CH</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Tsai</surname>
                            <given-names>C</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Sue</surname>
                            <given-names>KL</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>The feature selection effect on missing value imputation of medical datasets.</article-title>
                    <source>

                        <italic toggle="yes">Appl. Sci.</italic>
</source>
                    <year>2020</year>;<volume>10</volume>(<issue>7</issue>):<fpage>2344</fpage>.
                    <pub-id pub-id-type="doi">10.3390/app10072344</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref10">
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>McKinney</surname>
                            <given-names>W</given-names>
                        </name>
</person-group>:
                    <source>

                        <italic toggle="yes">Python for Data Analysis.</italic>
</source>
                    <edition>2nd ed.</edition>
                    <publisher-name>O'Reilly Media, Inc.</publisher-name>;<year>2017</year>.
                    <isbn>9781491957660</isbn>.
                    <ext-link ext-link-type="uri" xlink:href="https://www.oreilly.com/library/view/python-for-data/9781491957653/">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref8">
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Montgomery</surname>
                            <given-names>DC</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Peck</surname>
                            <given-names>EA</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Vining</surname>
                            <given-names>GG</given-names>
                        </name>
</person-group>:
                    <source>

                        <italic toggle="yes">Introduction to Linear Regression Analysis.</italic>
</source>
                    <edition>6th ed.</edition>
                    <publisher-loc>New York</publisher-loc>:
                    <publisher-name>John Wiley</publisher-name>;<year>2021</year>.
                    <isbn>978-1-119-57875-8</isbn>.
                    <ext-link ext-link-type="uri" xlink:href="https://www.wiley.com/en-us/Introduction+to+Linear+Regression+Analysis%2C+6th+Edition-p-9781119578758">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref11">
                <mixed-citation publication-type="other">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Sipakov</surname>
                            <given-names>R</given-names>
                        </name>
</person-group>:
                    <article-title>rsipakov/QuadraticPolynomialsPyDA: Utilizing quadratic polynomials within Python to conduct sophisticated data analysis. (v0.0.1).</article-title>
                    <source>

                        <italic toggle="yes">Zenodo.</italic>
</source>
                    <year>2024</year>.
                    <pub-id pub-id-type="doi">10.5281/zenodo.10637508</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref22">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Sipakov</surname>
                            <given-names>R</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Trofimovich</surname>
                            <given-names>V</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Voloshkina</surname>
                            <given-names>O</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Assessment and forecast for the creation of photochemical smog over transport overpasses in Kyiv.</article-title>
                    <source>

                        <italic toggle="yes">Environ. Safety Nat. Resour.</italic>
</source>
                    <year>2018</year>;<volume>25</volume>(<issue>1</issue>):<fpage>44</fpage>&#x2013;<lpage>51</lpage>.
                    <pub-id pub-id-type="doi">10.32347/2411-4049.2018.1.44-51</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref18">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Suh</surname>
                            <given-names>HK</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Song</surname>
                            <given-names>J</given-names>
                        </name>
</person-group>:
                    <article-title>A comparison of imputation methods using machine learning models.</article-title>
                    <source>

                        <italic toggle="yes">Commun. Stat. Appl. Methods.</italic>
</source>
                    <year>2023</year>;<volume>30</volume>(<issue>3</issue>):<fpage>331</fpage>&#x2013;<lpage>341</lpage>.
                    <pub-id pub-id-type="doi">10.29220/csam.2023.30.3.331</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref24">
                <mixed-citation publication-type="other">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Tsukurimichi</surname>
                            <given-names>T</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Inatsu</surname>
                            <given-names>Y</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Duy</surname>
                            <given-names>VNL</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Conditional selective inference for robust regression and outlier detection using piecewise-linear homotopy continuation.</article-title>
                    <year>2021</year>.
                    <pub-id pub-id-type="doi">10.48550/arxiv.2104.10840</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref9">
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>VanderPlas</surname>
                            <given-names>J</given-names>
                        </name>
</person-group>:
                    <source>

                        <italic toggle="yes">Python Data Science Handbook.</italic>
</source>
                    <publisher-name>O'Reilly Media, Inc.</publisher-name>;<year>2016</year>.
                    <isbn>9781491912058</isbn>.
                    <ext-link ext-link-type="uri" xlink:href="https://www.oreilly.com/library/view/python-data-science/9781491912126/">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref16">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Voloshkina</surname>
                            <given-names>O</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Tkachenko</surname>
                            <given-names>T</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Sipakov</surname>
                            <given-names>R</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>The estimation and reduction of risks caused by air pollution in cities.</article-title>
                    <source>

                        <italic toggle="yes">Budownictwo O Zoptymalizowanym Potencjale Energetycznym.</italic>
</source>
                    <year>2019</year>;<volume>8</volume>:<fpage>17</fpage>&#x2013;<lpage>25</lpage>.
                    <pub-id pub-id-type="doi">10.17512/bozpe.2019.2.02</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref3">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Wang</surname>
                            <given-names>J</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Sun</surname>
                            <given-names>A</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Gao</surname>
                            <given-names>Q</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Slag material's proportion optimised by polynomial regression.</article-title>
                    <source>

                        <italic toggle="yes">Proceedings of the Institution of Civil Engineers - Construction Materials.</italic>
</source>
                    <year>2014</year>;<volume>167</volume>(<issue>1</issue>):<fpage>8</fpage>&#x2013;<lpage>13</lpage>.
                    <pub-id pub-id-type="doi">10.1680/coma.12.00003</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref32">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Wu</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Zhong</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Liu</surname>
                            <given-names>Y</given-names>
                        </name>
</person-group>:
                    <article-title>A novel convolutional neural network for image steganalysis with shared normalization.</article-title>
                    <source>

                        <italic toggle="yes">IEEE Trans. Multimedia.</italic>
</source>
                    <year>2020</year>;<volume>22</volume>(<issue>1</issue>):<fpage>256</fpage>&#x2013;<lpage>270</lpage>.
                    <pub-id pub-id-type="doi">10.1109/tmm.2019.2920605</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref5">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Yadav</surname>
                            <given-names>RS</given-names>
                        </name>
</person-group>:
                    <article-title>Data analysis of COVID-2019 epidemic using machine learning methods: a case study of India.</article-title>
                    <source>

                        <italic toggle="yes">Int. J. Inf. Technol.</italic>
</source>
                    <year>2020</year>;<volume>12</volume>(<issue>4</issue>):<fpage>1321</fpage>&#x2013;<lpage>1330</lpage>.
                    <pub-id pub-id-type="pmid">32838124</pub-id>
                    <pub-id pub-id-type="doi">10.1007/s41870-020-00484-y</pub-id>
                    <pub-id pub-id-type="pmcid">PMC7250543</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref27">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Yaro</surname>
                            <given-names>AS</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Maly</surname>
                            <given-names>F</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Prazak</surname>
                            <given-names>P</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Outlier detection performance of a modified z-score method in time-series rss observation with hybrid scale estimators.</article-title>
                    <source>

                        <italic toggle="yes">IEEE Access.</italic>
</source>
                    <year>2024</year>;<volume>12</volume>:<fpage>12785</fpage>&#x2013;<lpage>12796</lpage>.
                    <pub-id pub-id-type="doi">10.1109/access.2024.3356731</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref26">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Yerlikaya-&#x00d6;zkurt</surname>
                            <given-names>F</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Askan</surname>
                            <given-names>A</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Weber</surname>
                            <given-names>G</given-names>
                        </name>
</person-group>:
                    <article-title>A hybrid computational method based on convex optimization for outlier problems: application to earthquake ground motion prediction.</article-title>
                    <source>

                        <italic toggle="yes">Informatica.</italic>
</source>
                    <year>2016</year>;<volume>27</volume>(<issue>4</issue>):<fpage>893</fpage>&#x2013;<lpage>910</lpage>.
                    <pub-id pub-id-type="doi">10.15388/informatica.2016.116</pub-id>
                </mixed-citation>
            </ref>
        </ref-list>
    </back>
    <sub-article article-type="reviewer-report" id="report315474">
        <front-stub>
            <article-id pub-id-type="doi">10.5256/f1000research.169942.r315474</article-id>
            <title-group>
                <article-title>Reviewer response for version 2</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author">
                    <name>
                        <surname>Wang</surname>
                        <given-names>Qiao</given-names>
                    </name>
                    <xref ref-type="aff" rid="r315474a1">1</xref>
                    <xref ref-type="aff" rid="r315474a2">2</xref>
                    <role>Referee</role>
                    <uri content-type="orcid">https://orcid.org/0000-0002-5271-0472</uri>
                </contrib>
                <aff id="r315474a1">
                    <label>1</label>Southeast University, Nanjing, China</aff>
                <aff id="r315474a2">
                    <label>2</label>School of Economics and Management, Southeast University, Nanjing, China</aff>
            </contrib-group>
            <author-notes>
                <fn fn-type="conflict">
                    <p>
                        <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>4</day>
                <month>9</month>
                <year>2024</year>
            </pub-date>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2024 Wang Q</copyright-statement>
                <copyright-year>2024</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access peer review report distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <related-article ext-link-type="doi" id="relatedArticleReport315474" related-article-type="peer-reviewed-article" xlink:href="10.12688/f1000research.149391.2"/>
            <custom-meta-group>
                <custom-meta>
                    <meta-name>recommendation</meta-name>
                    <meta-value>approve</meta-value>
                </custom-meta>
            </custom-meta-group>
        </front-stub>
        <body>
            <p>The quadratic polynomial is a fundamental modeling technique in data analysis, particularly because any smooth function can be approximated by a quadratic polynomial at a fixed point using a second-order Taylor expansion. This makes it a valuable concept for experts and researchers in the medical field to understand.&#x00a0;</p>
            <p> </p>
            <p> This revised version partially addressed my concerns in my initial review. However, it still avoids the more usual content concerning multivariate models.</p>
            <p>Are the conclusions about the tool and its performance adequately supported by the findings presented in the article?</p>
            <p>Partly</p>
            <p>Is the rationale for developing the new software tool clearly explained?</p>
            <p>No</p>
            <p>Is the description of the software tool technically sound?</p>
            <p>No</p>
            <p>Are sufficient details of the code, methods and analysis (if applicable) provided to allow replication of the software development and its use by others?</p>
            <p>No</p>
            <p>Is sufficient information provided to allow interpretation of the expected output datasets and any results generated using the tool?</p>
            <p>Partly</p>
            <p>Reviewer Expertise:</p>
            <p>Data analytics</p>
            <p>I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard.</p>
        </body>
    </sub-article>
    <sub-article article-type="reviewer-report" id="report315475">
        <front-stub>
            <article-id pub-id-type="doi">10.5256/f1000research.169942.r315475</article-id>
            <title-group>
                <article-title>Reviewer response for version 2</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author">
                    <name>
                        <surname>Molla</surname>
                        <given-names>Selim</given-names>
                    </name>
                    <xref ref-type="aff" rid="r315475a1">1</xref>
                    <role>Referee</role>
                    <uri content-type="orcid">https://orcid.org/0009-0007-2969-2791</uri>
                </contrib>
                <aff id="r315475a1">
                    <label>1</label>The University of Texas at El Paso, El Paso, Texas, USA</aff>
            </contrib-group>
            <author-notes>
                <fn fn-type="conflict">
                    <p>
                        <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>3</day>
                <month>9</month>
                <year>2024</year>
            </pub-date>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2024 Molla S</copyright-statement>
                <copyright-year>2024</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access peer review report distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <related-article ext-link-type="doi" id="relatedArticleReport315475" related-article-type="peer-reviewed-article" xlink:href="10.12688/f1000research.149391.2"/>
            <custom-meta-group>
                <custom-meta>
                    <meta-name>recommendation</meta-name>
                    <meta-value>approve</meta-value>
                </custom-meta>
            </custom-meta-group>
        </front-stub>
        <body>
            <p>
                <bold>Overall Assessment:</bold> The article&#x00a0;
                <italic>"Leveraging Quadratic Polynomials in Python for Advanced Data Analysis"</italic> is well-constructed and provides a valuable tool for researchers seeking to apply quadratic polynomials using Python. The authors have successfully demonstrated the tool's capability to model nonlinear relationships in data, offering practical guidance and sufficient details for replication. The work is technically sound and offers a clear rationale for the development of the software tool.</p>
            <p> </p>
            <p> 
                <bold>Recommendation for Multivariable Analysis:</bold> While the article is a strong contribution, I recommend that the authors consider expanding the scope to include multivariable analysis. The current focus on single-variable quadratic polynomials limits the applicability of the tool in more complex, real-world scenarios where multivariable models are often required. By incorporating or discussing multivariable quadratic polynomial models, the article would significantly enhance its relevance and utility for a broader audience.</p>
            <p> </p>
            <p> 
                <bold>Conclusion:</bold> I approve the article for indexing but strongly recommend including multivariable analysis in the current version or future updates. This addition would greatly improve the comprehensiveness and applicability of the tool, making it even more valuable for the research community.</p>
            <p>Are the conclusions about the tool and its performance adequately supported by the findings presented in the article?</p>
            <p>Yes</p>
            <p>Is the rationale for developing the new software tool clearly explained?</p>
            <p>Yes</p>
            <p>Is the description of the software tool technically sound?</p>
            <p>Yes</p>
            <p>Are sufficient details of the code, methods and analysis (if applicable) provided to allow replication of the software development and its use by others?</p>
            <p>Yes</p>
            <p>Is sufficient information provided to allow interpretation of the expected output datasets and any results generated using the tool?</p>
            <p>Yes</p>
            <p>Reviewer Expertise:</p>
            <p>Mathematical modeling, Discrete computer modeling and simulation, Machine learning, and Data analytics</p>
            <p>I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard.</p>
        </body>
    </sub-article>
    <sub-article article-type="reviewer-report" id="report290970">
        <front-stub>
            <article-id pub-id-type="doi">10.5256/f1000research.163848.r290970</article-id>
            <title-group>
                <article-title>Reviewer response for version 1</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author">
                    <name>
                        <surname>Wang</surname>
                        <given-names>Qiao</given-names>
                    </name>
                    <xref ref-type="aff" rid="r290970a1">1</xref>
                    <xref ref-type="aff" rid="r290970a2">2</xref>
                    <role>Referee</role>
                    <uri content-type="orcid">https://orcid.org/0000-0002-5271-0472</uri>
                </contrib>
                <aff id="r290970a1">
                    <label>1</label>Southeast University, Nanjing, China</aff>
                <aff id="r290970a2">
                    <label>2</label>School of Economics and Management, Southeast University, Nanjing, China</aff>
            </contrib-group>
            <author-notes>
                <fn fn-type="conflict">
                    <p>
                        <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>8</day>
                <month>8</month>
                <year>2024</year>
            </pub-date>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2024 Wang Q</copyright-statement>
                <copyright-year>2024</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access peer review report distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <related-article ext-link-type="doi" id="relatedArticleReport290970" related-article-type="peer-reviewed-article" xlink:href="10.12688/f1000research.149391.1"/>
            <custom-meta-group>
                <custom-meta>
                    <meta-name>recommendation</meta-name>
                    <meta-value>approve-with-reservations</meta-value>
                </custom-meta>
            </custom-meta-group>
        </front-stub>
        <body>
            <p>This paper explores modelling using quadratic polynomials in Python for data analysis applications. However, the study is limited to the single-variable case, which does not meet the standards of current applications. In regression analysis, multivariate quadratic polynomial models or more generalized higher order polynomial regressions are typically used, but these crucial aspects are not covered in the current work. I have comments as below:</p>
            <p> </p>
            <p> 1.&#x00a0;The "methods" outlined in this article lack distinction, since they are a naive description of the software tool; as a research article, they should be more prominently highlighted.</p>
            <p> </p>
            <p> 2.&#x00a0;The quadratic polynomial discussed in Section 2.1 mainly addresses the single-variable case. However, in a broader viewpoint, polynomial regression encompasses multivariable contexts, with its theoretical underpinnings and algorithms applied across various fields. I believe the explanation in this section could be revised and enhanced extensively.</p>
            <p> </p>
            <p> 3.&#x00a0;This entire subsection 2.1 could be reformulated using quadratic forms, along with pertinent linear algebra and matrix theory. Failing to do so would limit the model to a single-variable scenario.</p>
            <p> </p>
            <p> 4.&#x00a0;Section 3 solely demonstrates a standard example in the single-variable scenario. However, I recommend improving the clarity of its capabilities and limitations by introducing a counterexample, such as a dataset that fits well with a cubic curve but may fail when approximated with quadratic polynomial models.</p>
            <p> </p>
            <p> To summarize, this article's discussion on the Python library for quadratic regression modeling is limited to single-variable scenarios and does not effectively showcase the model's fitting capabilities. In my opinion, the content is overly simplistic and does not adequately address practical data analysis applications. Therefore, a thorough major revision is necessary.</p>
            <p>Are the conclusions about the tool and its performance adequately supported by the findings presented in the article?</p>
            <p>Partly</p>
            <p>Is the rationale for developing the new software tool clearly explained?</p>
            <p>No</p>
            <p>Is the description of the software tool technically sound?</p>
            <p>No</p>
            <p>Are sufficient details of the code, methods and analysis (if applicable) provided to allow replication of the software development and its use by others?</p>
            <p>No</p>
            <p>Is sufficient information provided to allow interpretation of the expected output datasets and any results generated using the tool?</p>
            <p>Partly</p>
            <p>Reviewer Expertise:</p>
            <p>Data analytics</p>
            <p>I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard, however I have significant reservations, as outlined above.</p>
        </body>
        <sub-article article-type="response" id="comment12208-290970">
            <front-stub>
                <contrib-group>
                    <contrib contrib-type="author">
                        <name>
                            <surname>Sipakov</surname>
                            <given-names>Rostyslav</given-names>
                        </name>
                        <aff>Environmental Protection, Kyiv National University of Construction and Architecture, Kyiv, Ukraine</aff>
                    </contrib>
                </contrib-group>
                <author-notes>
                    <fn fn-type="conflict">
                        <p>
                            <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                    </fn>
                </author-notes>
                <pub-date pub-type="epub">
                    <day>12</day>
                    <month>8</month>
                    <year>2024</year>
                </pub-date>
            </front-stub>
            <body>
                <p>Dear&#x00a0;Dr. Wang,</p>
                <p> </p>
                <p> Thank you very much for your review, which is of significant importance to our study.</p>
                <p> </p>
                <p> Although we aimed to present a simple and accessible tool for researchers with basic knowledge of Python programming, the comments from the previous reviewer regarding pre-processing and limitations and your comments regarding multivariate quadratic polynomial models will allow us to present a substantial version of this tool.</p>
                <p> </p>
                <p> For technical reasons, your comments were published after we submitted a new version (revision 1) of the manuscript to the editorial office based on the previous reviewer's comments. Nevertheless, we have begun work on a new version (revision 2) of the manuscript to reflect your valuable comments.</p>
                <p> </p>
                <p> Thank you once again for providing the opportunity to significantly improve our study.</p>
                <p> </p>
                <p> Sincerely,</p>
                <p> Dr. Sipakov</p>
            </body>
        </sub-article>
    </sub-article>
    <sub-article article-type="reviewer-report" id="report305465">
        <front-stub>
            <article-id pub-id-type="doi">10.5256/f1000research.163848.r305465</article-id>
            <title-group>
                <article-title>Reviewer response for version 1</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author">
                    <name>
                        <surname>Molla</surname>
                        <given-names>Selim</given-names>
                    </name>
                    <xref ref-type="aff" rid="r305465a1">1</xref>
                    <role>Referee</role>
                    <uri content-type="orcid">https://orcid.org/0009-0007-2969-2791</uri>
                </contrib>
                <aff id="r305465a1">
                    <label>1</label>The University of Texas at El Paso, El Paso, Texas, USA</aff>
            </contrib-group>
            <author-notes>
                <fn fn-type="conflict">
                    <p>
                        <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>29</day>
                <month>7</month>
                <year>2024</year>
            </pub-date>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2024 Molla S</copyright-statement>
                <copyright-year>2024</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access peer review report distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <related-article ext-link-type="doi" id="relatedArticleReport305465" related-article-type="peer-reviewed-article" xlink:href="10.12688/f1000research.149391.1"/>
            <custom-meta-group>
                <custom-meta>
                    <meta-name>recommendation</meta-name>
                    <meta-value>approve-with-reservations</meta-value>
                </custom-meta>
            </custom-meta-group>
        </front-stub>
        <body>
            <p>The article is fundamentally sound and makes a significant contribution to the application of quadratic polynomials in data analysis using Python. However, to enhance clarity, completeness, and practical utility, the following revisions are recommended:</p>
            <p> </p>
            <p> 
                <underline>
                    <bold>Introduction: Detailed Explanation of Suitability</bold>
                </underline>
            </p>
            <p> 
                <bold>Improvement:</bold> Provide a more detailed explanation of why quadratic polynomials are particularly suitable for modelling and analysing data, compared to other polynomial or non-linear models.</p>
            <p> 
                <bold>Details:</bold> Explain the unique advantages of quadratic polynomials in capturing curvature and non-linear relationships. Compare briefly with other models (e.g., linear, cubic polynomials) to highlight the specific scenarios where quadratic polynomials are most effective.</p>
            <p> 
                <underline>
                    <bold>Methods: Data Preprocessing Steps</bold>
                </underline>
            </p>
            <p> 
                <bold>Improvement:</bold> Include a more detailed explanation of the data preprocessing steps, such as handling missing values or outliers.</p>
            <p> 
                <bold>Details:</bold> Add a subsection detailing the preprocessing steps taken before fitting the quadratic model. This should include techniques for handling missing data, outlier detection and treatment, and any data normalization or scaling applied.</p>
            <p> 
                <underline>
                    <bold>Methods: Discussion of R-squared Limitations</bold>
                </underline>
            </p>
            <p> 
                <bold>Improvement:</bold> Briefly discuss the limitations of using R-squared as the sole measure of model fit and suggest additional metrics.</p>
            <p> 
                <bold>Details:</bold> Include a paragraph explaining that while R-squared is useful, it has limitations, especially in non-linear contexts. Suggest other metrics like Adjusted R-squared, Mean Squared Error (MSE), or Root Mean Squared Error (RMSE) to provide a more comprehensive evaluation.</p>
            <p> 
                <underline>
                    <bold>Results: Comparison with Other Models</bold>
                </underline>
            </p>
            <p> 
                <bold>Improvement:</bold> Include a comparison with other models, such as linear regression or higher-degree polynomials, to provide a broader perspective on the performance of quadratic models.</p>
            <p> 
                <bold>Details:</bold> Add a section that compares the performance of quadratic polynomials with linear and cubic models using the same datasets. Use metrics like R-squared, Adjusted R-squared, and MSE to compare the fit and predictive accuracy.</p>
            <p> 
                <underline>
                    <bold>Discussion: Challenges and Limitations</bold>
                </underline>
            </p>
            <p> 
                <bold>Improvement:</bold> Delve deeper into the potential challenges and limitations of quadratic polynomials, such as overfitting or sensitivity to data variability.</p>
            <p> 
                <bold>Details:</bold> Discuss scenarios where quadratic polynomials might overfit, particularly with small or noisy datasets. Provide suggestions for mitigating these issues, such as regularization techniques or cross-validation methods. Mention the sensitivity of quadratic models to data variability and how to handle such cases.</p>
            <p>Are the conclusions about the tool and its performance adequately supported by the findings presented in the article?</p>
            <p>Yes</p>
            <p>Is the rationale for developing the new software tool clearly explained?</p>
            <p>Yes</p>
            <p>Is the description of the software tool technically sound?</p>
            <p>Yes</p>
            <p>Are sufficient details of the code, methods and analysis (if applicable) provided to allow replication of the software development and its use by others?</p>
            <p>Yes</p>
            <p>Is sufficient information provided to allow interpretation of the expected output datasets and any results generated using the tool?</p>
            <p>Yes</p>
            <p>Reviewer Expertise:</p>
            <p>Mathematical modeling, Discrete computer modeling and simulation, Machine learning, and Data analytics</p>
            <p>I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard, however I have significant reservations, as outlined above.</p>
        </body>
        <sub-article article-type="response" id="comment12123-305465">
            <front-stub>
                <contrib-group>
                    <contrib contrib-type="author">
                        <name>
                            <surname>Sipakov</surname>
                            <given-names>Rostyslav</given-names>
                        </name>
                        <aff>Environmental Protection, Kyiv National University of Construction and Architecture, Kyiv, Ukraine</aff>
                    </contrib>
                </contrib-group>
                <author-notes>
                    <fn fn-type="conflict">
                        <p>
                            <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                    </fn>
                </author-notes>
                <pub-date pub-type="epub">
                    <day>1</day>
                    <month>8</month>
                    <year>2024</year>
                </pub-date>
            </front-stub>
            <body>
                <p>Dear&#x00a0;Selim Molla,</p>
                <p> </p>
                <p> Thank you very much for your valuable comments. Based on them, we have revised the article and highlighted the changes in red font.&#x00a0;Due to the significant volume of changes we have made, including new figures, we provide a brief description of what we have done below.</p>
                <p> </p>
                <p> The full text of the preprint of revision 1 can be obtained via the following link: <ext-link ext-link-type="uri" xlink:href="https://arxiv.org/abs/2402.06133">https://arxiv.org/abs/2402.06133</ext-link>.</p>
                <p> Please wait for the updated version (version 3) to be published.</p>
                <p> Announcement schedule:&#x00a0;Thursday, 1 August 2024, 20:00</p>
                <p> </p>
                <p> Also, a new version has been submitted to the editorial office, and we hope it will be published soon.&#x00a0;Within one business day, we will also publish the updated code on GitHub.</p>
                <p> </p>
                <p> 
                    <bold>What has been done:</bold>
                </p>
                <p> </p>
                <p> 
                    <bold>Point 1:</bold>&#x00a0;Introduction: Detailed Explanation of Suitability.</p>
                <p> 
                    <bold>Response 1:</bold>&#x00a0;This paper highlights quadratic polynomials' unique advantages in capturing curvature and non-linear relationships. It also includes a brief comparison with other models, such as linear and cubic polynomials, emphasizing specific scenarios where quadratic polynomials are most effective.</p>
                <p> </p>
                <p> 
                    <bold>Point 2:</bold> Methods: Data Preprocessing Steps</p>
                <p> 
                    <bold>Response 2:&#x00a0;</bold>A new subsection has been added detailing the preprocessing steps undertaken before fitting the quadratic model. This includes techniques for handling missing data, detecting and treating outliers, and applying data normalization or scaling. This addition aims to provide a clearer understanding of the steps taken to prepare the data for analysis.</p>
                <p> </p>
                <p> 
                    <bold>Point 3: </bold>Methods: Discussion of R-squared Limitations</p>
                <p> 
                    <bold>Response 3:&#x00a0;</bold>The methods section now contains a paragraph discussing the limitations of using R-squared as the sole measure of model fit. It suggests additional metrics such as Adjusted R-squared, Mean Squared Error (MSE), and Root Mean Squared Error (RMSE) to offer a more comprehensive evaluation of model performance.</p>
                <p> </p>
                <p> 
                    <bold>Point 4:</bold>&#x00a0;Results: Comparison with Other Models</p>
                <p> 
                    <bold>Response 4:&#x00a0;</bold>A new section has been included comparing the performance of quadratic polynomials with linear and cubic models using the same datasets. The comparison uses metrics like R-squared, Adjusted R-squared, and MSE to evaluate the fit and predictive accuracy, providing a broader perspective on the effectiveness of quadratic models.</p>
                <p> </p>
                <p> 
                    <bold>Point 5:</bold>&#x00a0;Discussion: Challenges and Limitations</p>
                <p> 
                    <bold>Response 5:&#x00a0;</bold>The discussion now delves deeper into the potential challenges and limitations of quadratic polynomials, such as overfitting and sensitivity to data variability. It addresses scenarios where quadratic polynomials might overfit, particularly with small or noisy datasets, and suggests methods for mitigating these issues, including regularization techniques and cross-validation methods. This addition aims to provide a more balanced view of the use of quadratic polynomials in data analysis.</p>
            </body>
        </sub-article>
        <sub-article article-type="response" id="comment12264-305465">
            <front-stub>
                <contrib-group>
                    <contrib contrib-type="author">
                        <name>
                            <surname>Sipakov</surname>
                            <given-names>Rostyslav</given-names>
                        </name>
                        <aff>Environmental Protection, Kyiv National University of Construction and Architecture, Kyiv, Ukraine</aff>
                    </contrib>
                </contrib-group>
                <author-notes>
                    <fn fn-type="conflict">
                        <p>
                            <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                    </fn>
                </author-notes>
                <pub-date pub-type="epub">
                    <day>20</day>
                    <month>8</month>
                    <year>2024</year>
                </pub-date>
            </front-stub>
            <body>
                <p>Dear&#x00a0;Selim Molla,</p>
                <p> </p>
                <p> We have received a notification from the editorial board that version 2 of our manuscript has been published. We are currently working on version 3 to address the comments provided by another reviewer; nonetheless, we would greatly appreciate your feedback on how we have addressed your significant conceptual remarks, which we have endeavored to incorporate into version 2 of our manuscript. Once again, thank you very much for your attention and for providing valuable conceptual insights into our work.</p>
                <p> </p>
                <p> Sincerely,</p>
                <p> Dr. Sipakov</p>
            </body>
        </sub-article>
    </sub-article>
</article>
