<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.2 20190208//EN" "http://jats.nlm.nih.gov/publishing/1.2/JATS-journalpublishing1.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="1.2" xml:lang="en">
    <front>
        <journal-meta>
            <journal-id journal-id-type="pmc">F1000Research</journal-id>
            <journal-title-group>
                <journal-title>F1000Research</journal-title>
            </journal-title-group>
            <issn pub-type="epub">2046-1402</issn>
            <publisher>
                <publisher-name>F1000 Research Limited</publisher-name>
                <publisher-loc>London, UK</publisher-loc>
            </publisher>
        </journal-meta>
        <article-meta>
            <article-id pub-id-type="doi">10.12688/f1000research.170647.1</article-id>
            <article-categories>
                <subj-group subj-group-type="heading">
                    <subject>Research Article</subject>
                </subj-group>
                <subj-group>
                    <subject>Articles</subject>
                </subj-group>
            </article-categories>
            <title-group>
                <article-title>Dependency&#x2011;Light ML Forecasts of ASEAN Smoking Prevalence with Uncertainty &amp; Policy Scenarios (1990&#x2011;2035)</article-title>
                <fn-group content-type="pub-status">
                    <fn>
                        <p>[version 1; peer review: 1 approved with reservations]</p>
                    </fn>
                </fn-group>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author" corresp="yes">
                    <name>
                        <surname>Ahmad</surname>
                        <given-names>Awab</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Data Curation</role>
                    <role content-type="http://credit.niso.org/">Methodology</role>
                    <role content-type="http://credit.niso.org/">Project Administration</role>
                    <role content-type="http://credit.niso.org/">Resources</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Original Draft Preparation</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <uri content-type="orcid">https://orcid.org/0009-0006-7376-9875</uri>
                    <xref ref-type="corresp" rid="c1">a</xref>
                    <xref ref-type="aff" rid="a1">1</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Aleem</surname>
                        <given-names>Rida</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Data Curation</role>
                    <role content-type="http://credit.niso.org/">Project Administration</role>
                    <role content-type="http://credit.niso.org/">Resources</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Original Draft Preparation</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <xref ref-type="aff" rid="a1">1</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Ahmad</surname>
                        <given-names>Mahmood</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Conceptualization</role>
                    <role content-type="http://credit.niso.org/">Data Curation</role>
                    <role content-type="http://credit.niso.org/">Investigation</role>
                    <role content-type="http://credit.niso.org/">Methodology</role>
                    <role content-type="http://credit.niso.org/">Project Administration</role>
                    <role content-type="http://credit.niso.org/">Resources</role>
                    <role content-type="http://credit.niso.org/">Software</role>
                    <role content-type="http://credit.niso.org/">Supervision</role>
                    <role content-type="http://credit.niso.org/">Validation</role>
                    <role content-type="http://credit.niso.org/">Visualization</role>
                    <uri content-type="orcid">https://orcid.org/0000-0001-9107-3704</uri>
                    <xref ref-type="aff" rid="a2">2</xref>
                </contrib>
                <aff id="a1">
                    <label>1</label>St George's University of London, London, England, UK</aff>
                <aff id="a2">
                    <label>2</label>Royal Free Hospital, Royal Free London NHS Foundation Trust, London, England, UK</aff>
            </contrib-group>
            <author-notes>
                <corresp id="c1">
                    <label>a</label>
                    <email xlink:href="mailto:m2100124@sgul.ac.uk">m2100124@sgul.ac.uk</email>
                </corresp>
                <fn fn-type="conflict">
                    <p>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>10</day>
                <month>4</month>
                <year>2026</year>
            </pub-date>
            <pub-date pub-type="collection">
                <year>2026</year>
            </pub-date>
            <volume>15</volume>
            <elocation-id>500</elocation-id>
            <history>
                <date date-type="accepted">
                    <day>11</day>
                    <month>3</month>
                    <year>2026</year>
                </date>
            </history>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2026 Ahmad A et al.</copyright-statement>
                <copyright-year>2026</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access article distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <self-uri content-type="pdf" xlink:href="https://f1000research.com/articles/15-500/pdf"/>
            <abstract>
                <sec>
                    <title>Background</title>
                    <p>Within the ASEAN region, smoking is one of the leading preventable causes of death, contributing to over 10% of all global smoking-related deaths. Accurate policy modelling and effective forecasting are therefore vital to support strategies that aim to control tobacco regionally.</p>
                </sec>
                <sec>
                    <title>Methods</title>
                    <p>Our study created an installation-free, open-source machine learning model that could predict smoking prevalence and simulate the potential effect of a 15% tobacco tax rise within the 11 ASEAN countries. This was done by clustering countries based on historical prevalence using dynamic time warping k-means (DTW-kM). The performance of the model was then compared with the traditional autoregressive integrated moving average (ARIMA) approach, which used mean absolute error (MAE) as the primary accuracy metric.</p>
                </sec>
                <sec>
                    <title>Results</title>
                    <p>Compared to the traditional ARIMA, the stacked long short term memory (LSTM) model performed better in forecasting accuracy (median MAE 0.32 vs 0.46 percentage points, p&#x00a0;&lt;&#x00a0;0.01). If no intervention is made, the smoking prevalence across the ASEAN region will fall from 26.35 (2022) to 24.6% by 2035. Implementing a 15% tax rise in 2026 improves this percentage to 22.0% which averts 1.3 million disability-adjusted life years (DALYs).</p>
                </sec>
                <sec>
                    <title>Conclusion</title>
                    <p>This openly accessible tool therefore supports evidence-based tobacco policy and provides a reproducible, data-driven approach to forecast tobacco use trends and evaluate the effect of policy interventions.</p>
                </sec>
            </abstract>
            <kwd-group kwd-group-type="author">
                <kwd>Smoking prevalence; ASEAN; Machine learning; Forecasting; Tobacco tax; Public health policy</kwd>
            </kwd-group>
            <funding-group>
                <award-group id="fund-1" xlink:href="https://doi.org/10.13039/501100004337">
                    <funding-source>St. George's, University of London</funding-source>
                </award-group>
                <funding-statement>The author(s) declared that no grants were involved in supporting this work.</funding-statement>
            </funding-group>
        </article-meta>
    </front>
    <body>
        <sec id="sec5" sec-type="intro">
            <title>Introduction</title>
            <p>Smoking is one of the major causes of preventable death in the ASEAN region, accounting for over 10% of all global smoking related deaths (
                <xref ref-type="bibr" rid="ref2">Dai et al., 2025</xref>). Despite the World Health Organization&#x2019;s (WHO) target to reduce adult smoking prevalence by 30% from 2010 to 2030, there has been limited progress across ASEAN countries (
                <xref ref-type="bibr" rid="ref7">World Health Organization, 2023</xref>). The smoking trends for the ASEAN countries were clustered (
                <xref ref-type="fig" rid="f1">
Figure 1</xref>) and forecasted aggregate smoking prevalence can also be seen (
                <xref ref-type="fig" rid="f2">
Figure 2</xref>). Few studies have explored the impact of future policies on this goal and have used complex methods that are difficult to reproduce.</p>
            <fig fig-type="figure" id="f1" orientation="portrait" position="float">
                <label>
Figure 1. </label>
                <caption>
                    <title>Smoking prevalence trends in 11 ASEAN countries, 1990&#x2013;2022.</title>
                    <p>The age standardized smoking prevalence rates for all 11 ASEAN countries can be seen over the period of 1990&#x2013;2022 for both sexes. Each coloured line represents a different country indicated by the key and illustrates historical trends in smoking prevalence.</p>
                </caption>
                <graphic id="gr1" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/188135/cc6441e1-d3e6-4e1f-bb73-da93ed78c946_figure1.gif"/>
            </fig>
            <fig fig-type="figure" id="f2" orientation="portrait" position="float">
                <label>
Figure 2. </label>
                <caption>
                    <title>ASEAN aggregate smoking prevalence: observed vs forecast.</title>
                    <p>The forecasted age standardized smoking prevalence rates for both sexes were generated using the stacked LSTM model based on previous trends. The dashed lines represent the predicted average prevalence across all ASEAN countries from 2023 to 2035. The solid line illustrates the actual observed average smoking prevalence for all 11 ASEAN countries from 1990 to 2022.</p>
                </caption>
                <graphic id="gr2" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/188135/cc6441e1-d3e6-4e1f-bb73-da93ed78c946_figure2.gif"/>
            </fig>
            <p>Long short-term memory (LSTM) networks are types of machine learning (ML) models that have proven to be promising in forecasting public health trends and predicting future behaviours (
                <xref ref-type="bibr" rid="ref3">Hochreiter and Schmidhuber, 1997</xref>). These models have performed well in predicting infectious disease outbreaks but have not been used in tobacco control.</p>
            <p>This study aimed to build a ML tool that could be operated without additional software and could: help group ASEAN countries based on past smoking trends, produce reliable forecasts up to 2035 and thirdly simulate the impact on health of introducing new policies such as increased tobacco tax.</p>
        </sec>
        <sec id="sec6" sec-type="methods">
            <title>Method</title>
            <sec id="sec7">
                <title>Data sources</title>
                <p>Open-access datasets from the Global Burden of Disease Study 2021 were used (
                    <xref ref-type="bibr" rid="ref2">Dai et al., 2025</xref>) to access age-standardized smoking prevalence rates from 1990&#x2013;2022 for 11 ASEAN countries (
                    <xref ref-type="bibr" rid="ref5">Institute for Health Metrics and Evaluation, 2024b</xref>). Alongside this, additional variables such as GDP per capita, tobacco tax levels and tobacco control scores were included if available. Smoking attributable disease burden (DALYs) were also collected from Global Burden of Disease 2021 (GBD 2021) (
                    <xref ref-type="bibr" rid="ref4">Institute for Health Metrics and Evaluation, 2024a</xref>).</p>
            </sec>
            <sec id="sec8">
                <title>Pre-processing and clustering</title>
                <p>Of the data collected, we filtered out only age-standardised, both sex prevalence rates that had no missing values and each country&#x2019;s smoking history was presented as a 33-year timeline. The 11 countries were then grouped into three clusters using a time series method called Dynamic Time Warping (DTW-kM). When this was unavailable, the system defaulted to a simpler method using Euclidean distance.</p>
            </sec>
            <sec id="sec9">
                <title>Forecasting</title>
                <p>We built a machine learning model (stacked LSTM network) that predicted future smoking trends based on the past six years of data. This model&#x2019;s output was then compared with two current baselines: ARIMA (a traditional statistical model) and a naive model, which assumed no change. Dropout sampling was also used to estimate uncertainty, and built-in validation was used to compare forecast accuracy from 2018&#x2013;2022.</p>
            </sec>
            <sec id="sec10">
                <title>Policy simulation</title>
                <p>Policy changes were simulated using a tool in the model such as a 15% tobacco tax rise in 2026 which was modelled to estimate its effect on smoking rates and related disease burden. DALYs were adjusted based on known elasticities (0.7% DALY reduction per 1% drop in prevalence) (
                    <xref ref-type="bibr" rid="ref6">Nazar et al., 2021</xref>).</p>
            </sec>
            <sec id="sec11">
                <title>Reproducibility</title>
                <p>The entire system is very reproducible as it runs in under 5&#x00a0;seconds and logs all code version and data hashes which ensures transparency.</p>
            </sec>
        </sec>
        <sec id="sec12" sec-type="results">
            <title>Results</title>
            <p>The 11 ASEAN countries were categorized into three main groups based on their smoking trends:</p>
            <p>Early Convergers &#x2013; Singapore, Brunei: had already reduced smoking prevalence to below 15% by 2022.</p>
            <p>Mid Decliners &#x2013; Malaysia, Philippines, Thailand: have experienced a steady decline of 1.2 percentage points (pp) per year since 2005.</p>
            <p>Late Stagnators &#x2013; Indonesia, Myanmar, Vietnam: which still have high smoking rates of around 28% with little recent progress.</p>
            <sec id="sec13">
                <title>Forecasting accuracy</title>
                <p>The LSTM model outperformed the ARIMA model in 9 out of 11 countries. The median absolute error from 2018 to 2022 was lower for LSTM (0.32&#x00a0;pp, 95% CI: 0.26&#x2013;0.40) than for ARIMA (0.46&#x00a0;pp, 95% CI: 0.39&#x2013;0.57), with a statistically significant difference (p&#x00a0;&lt;&#x00a0;0.01).</p>
            </sec>
            <sec id="sec14">
                <title>Future projections</title>
                <p>Based on current trends, the average smoking rate in the ASEAN countries will decrease modestly from 26.3% in 2022 to 24.6% by 2035 if current trends continue. Singapore is the only country projected to achieve the WHO target of less than 30% by 2030 (
                    <xref ref-type="bibr" rid="ref7">World Health Organization, 2023</xref>).</p>
            </sec>
            <sec id="sec15">
                <title>Tax simulation</title>
                <p>On introduction of a tobacco tax of 15% in 2026, the expected prevalence in 2035 drops to 22% which could prevent 1.3 million smoking related DALYs across the region from a single policy.</p>
            </sec>
            <sec id="sec16">
                <title>Sensitivity checks</title>
                <p>Adjusting the settings of the model e.g. adding more country clusters or longer input data windows had very minimal effects on the overall results which affirms the stability of the model.</p>
            </sec>
        </sec>
        <sec id="sec17" sec-type="discussion">
            <title>Discussion</title>
            <p>This lightweight machine learning tool is the first that has been developed to forecast smoking prevalence across ASEAN countries. The study creates opportunities for shared learning and policy collaboration as it groups countries based on past smoking trends. For example, Malaysia&#x2019;s trajectory closely mirrors that of the Philippines and Thailand, while Indonesia&#x2019;s trends resemble those of Myanmar and Vietnam.</p>
            <p>The results show that LSTM models have higher accuracy when compared to traditional ARIMA methods which is also consistent with what has been seen in infectious disease forecasting. The LSTM model is highly practical in low-resource settings such as government health departments or public health NGOs due to it not requiring external software installations.</p>
            <p>Based on current policies, without stronger action, most ASEAN countries will clearly not meet the WHO target of a 30% reduction in smoking prevalence by 2030. Smoking rates could be significantly reduced, and over 1 million years of life lost to smoking-related disease could be prevented with interventions such as a 15% increase in tobacco taxes.</p>
            <sec id="sec18">
                <title>Limitations</title>
                <p>

                    <list list-type="bullet">
                        <list-item>
                            <label>-</label>
                            <p>The smoking trends were not modelled by age group</p>
                        </list-item>
                        <list-item>
                            <label>-</label>
                            <p>The relationship between prevalence reduction and DALYs was assumed to be linear</p>
                        </list-item>
                        <list-item>
                            <label>-</label>
                            <p>Newly emerging trends such as vaping and e-cigarette use were not included or investigated in the study</p>
                        </list-item>
                    </list>
                </p>
            </sec>
            <sec id="sec19">
                <title>Future directions</title>
                <p>In the future, more detailed data such as age and income could be incorporated. The model could also be expanded by exploring e-cigarette usage and vaping using advanced machine learning methods such as Temporal Fusion Transformers to improve the accuracy and applicability of the study.</p>
            </sec>
        </sec>
        <sec id="sec20" sec-type="conclusion">
            <title>Conclusion</title>
            <p>We developed a simple machine learning tool that does not require installation and can predict smoking trends while assessing policy impacts across ASEAN. Based on our analysis, most countries will not achieve the WHO target unless stronger tobacco control measures are implemented. Even a modest tax increase could avoid over a million DALYs. The overall framework is also adaptable to other public health areas without external software installation.</p>
        </sec>
        <sec id="sec21">
            <title>Software availability</title>
            <p>Source code available from: 
                <ext-link ext-link-type="uri" xlink:href="https://github.com/awabahmad469/smoking-analysis">https://github.com/awabahmad469/smoking-analysis
</ext-link>
            </p>
            <p>Archived source code at: 
                <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.5281/zenodo.17499927">https://doi.org/10.5281/zenodo.17499927</ext-link>
            </p>
            <p>License: MIT.</p>
            <p>This software is based on code originally published by Mahmood Ahmad (DOI: 
                <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.5281/zenodo.17095791">https://doi.org/10.5281/zenodo.17095791</ext-link>) and has been reused and extended with permission under the MIT License.</p>
        </sec>
        <sec id="sec22">
            <title>Ethics and consent</title>
            <p>Ethical approval and consent were not required for this study as it used publicly available, deidentified datasets and there was no direct involvement from human participants.</p>
            <p>The primary data on smoking prevalence and disease burden were obtained from the Institute for Health Metrics and Evaluation (IHME) Global Burden of Disease Study 2021, accessible at 
                <ext-link ext-link-type="uri" xlink:href="https://ghdx.healthdata.org/record/ihme-data/gbd-2021-asean-smoking-prevalence-burden-1990-2021">https://ghdx.healthdata.org/record/ihme-data/gbd-2021-asean-smoking-prevalence-burden-1990-2021</ext-link> (accessed 30 July 2025).</p>
            <p>Additional variables and processed datasets generated for analysis, including extrapolations to 2022 and policy simulation inputs, are publicly archived on Zenodo at 
                <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.5281/zenodo.17095791">https://doi.org/10.5281/zenodo.17095791</ext-link>, enabling full reproducibility by readers and reviewers.</p>
        </sec>
    </body>
    <back>
        <sec id="sec25" sec-type="data-availability">
            <title>Data availability</title>
            <p>The dataset used in this study is publicly available from Mahmood 
                <xref ref-type="bibr" rid="ref1">Ahmad (2025)</xref>, &#x201c;Smoking&#x201d;, Zenodo, 
                <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.5281/zenodo.17095791">https://doi.org/10.5281/zenodo.17095791</ext-link>.</p>
            <p>The data can be accessed by any reader without registration, and reuse is permitted under the 
                <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution 4.0 International</ext-link> (CC BY 4.0) license, with appropriate attribution to the original author.</p>
        </sec>
        <ack>
            <title>Acknowledgments</title>
            <p>Portions of the Python code archived on Zenodo were drafted with assistance from ChatGPT (o3-mini) and used to help in code development. All outputs were reviewed, tested, and validated by the authors.</p>
        </ack>
        <ref-list>
            <title>References</title>
            <ref id="ref1">
                <mixed-citation publication-type="other">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Ahmad</surname>
                            <given-names>M</given-names>
                        </name>
</person-group>:
                    <article-title>Smoking datasets used in &#x201c;Forecasting smoking prevalence in ASEAN countries using machine learning&#x201d;.</article-title>
                    <source>

                        <italic toggle="yes">Zenodo.</italic>
</source>
                    <year>2025</year>. (Accessed: 11 September 2025).
                    <pub-id pub-id-type="doi">10.5281/zenodo.17095791</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref2">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Dai</surname>
                            <given-names>X</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Ng</surname>
                            <given-names>M</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Gil</surname>
                            <given-names>GF</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>The epidemiology and burden of smoking in countries of the Association of Southeast Asian Nations (ASEAN), 1990&#x2013;2021: findings from the Global Burden of Disease Study 2021.</article-title>
                    <source>

                        <italic toggle="yes">Lancet Public Health.</italic>
</source>
                    <year>2025</year>;<volume>10</volume>(<issue>6</issue>):<fpage>e442</fpage>&#x2013;<lpage>e455</lpage>.
                    <pub-id pub-id-type="pmid">40441812</pub-id>
                    <pub-id pub-id-type="doi">10.1016/s2468-2667(24)00326-8</pub-id>
                    <pub-id pub-id-type="pmcid">PMC12127265</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref3">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Hochreiter</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Schmidhuber</surname>
                            <given-names>J</given-names>
                        </name>
</person-group>:
                    <article-title>Long short-term memory.</article-title>
                    <source>

                        <italic toggle="yes">Neural Comput.</italic>
</source>
                    <year>1997</year>;<volume>9</volume>(<issue>8</issue>):<fpage>1735</fpage>&#x2013;<lpage>1780</lpage>.
                    <pub-id pub-id-type="doi">10.1162/neco.1997.9.8.1735</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref4">
                <mixed-citation publication-type="other">
                    <collab>Institute for Health Metrics and Evaluation</collab>:
                    <article-title>Global Burden of Disease 2021: Findings from the GBD 2021 Study.</article-title>
                    <year>2024a</year>;<fpage>17</fpage>. (Accessed: 31 July 2025).
                    <ext-link ext-link-type="uri" xlink:href="https://www.healthdata.org/sites/default/files/2024-05/GBD_2021_Booklet_FINAL_2024.05.16.pdf">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref5">
                <mixed-citation publication-type="other">
                    <collab>Institute for Health Metrics and Evaluation</collab>:
                    <article-title>Global Burden of Disease (GBD 2021) ASEAN Smoking Prevalence &amp; Burden 1990&#x2013;2021. Global Health Data Exchange.</article-title>
                    <year>2024b</year>. (Accessed: 30 July 2025).
                    <ext-link ext-link-type="uri" xlink:href="https://ghdx.healthdata.org/record/ihme-data/gbd-2021-asean-smoking-prevalence-burden-1990-2021">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref6">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Nazar</surname>
                            <given-names>GP</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Sharma</surname>
                            <given-names>N</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Chugh</surname>
                            <given-names>A</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Impact of tobacco price and taxation on affordability and consumption of tobacco products in the South-East Asia Region: A systematic review.</article-title>
                    <source>

                        <italic toggle="yes">Tob. Induc. Dis.</italic>
</source>
                    <year>2021</year>:<volume>19</volume>:<fpage>1</fpage>,<lpage>17</lpage>. (Accessed: 31 July 2025).
                    <pub-id pub-id-type="pmid">34992513</pub-id>
                    <pub-id pub-id-type="doi">10.18332/tid/143179</pub-id>
                    <pub-id pub-id-type="pmcid">PMC8669701</pub-id>
                    <ext-link ext-link-type="uri" xlink:href="https://www.researchgate.net/publication/357186338_Impact_of_tobacco_price_and_taxation_on_affordability_and_consumption_of_tobacco_products_in_the_South-East_Asia_Region_A_systematic_review">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref7">
                <mixed-citation publication-type="other">
                    <collab>World Health Organization</collab>:
                    <article-title>Implementation roadmap 2023&#x2013;2030 for the Global action plan for the prevention and control of noncommunicable diseases.</article-title>
                    <year>2023</year>. (Accessed: 31 July 2025).
                    <ext-link ext-link-type="uri" xlink:href="https://www.who.int/teams/noncommunicable-diseases/governance/roadmap">Reference Source</ext-link>
                </mixed-citation>
            </ref>
        </ref-list>
    </back>
    <sub-article article-type="reviewer-report" id="report475280">
        <front-stub>
            <article-id pub-id-type="doi">10.5256/f1000research.188135.r475280</article-id>
            <title-group>
                <article-title>Reviewer response for version 1</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author">
                    <name>
                        <surname>Mart&#x00ed;n-&#x00c1;lvarez</surname>
                        <given-names>Juan Manuel</given-names>
                    </name>
                    <xref ref-type="aff" rid="r475280a1">1</xref>
                    <role>Referee</role>
                </contrib>
                <aff id="r475280a1">
                    <label>1</label>Universidad Internacional de La Rioja (UNIR), Logro&#x00f1;o, Spain</aff>
            </contrib-group>
            <author-notes>
                <fn fn-type="conflict">
                    <p>
                        <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>6</day>
                <month>6</month>
                <year>2026</year>
            </pub-date>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2026 Mart&#x00ed;n-&#x00c1;lvarez JM</copyright-statement>
                <copyright-year>2026</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access peer review report distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <related-article ext-link-type="doi" id="relatedArticleReport475280" related-article-type="peer-reviewed-article" xlink:href="10.12688/f1000research.170647.1"/>
            <custom-meta-group>
                <custom-meta>
                    <meta-name>recommendation</meta-name>
                    <meta-value>approve-with-reservations</meta-value>
                </custom-meta>
            </custom-meta-group>
        </front-stub>
        <body>
            <p>This article addresses an important public health issue by developing a machine learning framework to forecast smoking prevalence in ASEAN countries and simulate the impact of tobacco taxation policies. The study is timely, relevant, and has clear potential for policy application, particularly given its emphasis on accessibility and reproducibility through an open-source, installation-free tool.</p>
            <p> The manuscript is generally well structured and clearly written. The objectives are well defined, and the results are presented in a straightforward manner. The comparison between LSTM and ARIMA models is useful, and the inclusion of policy simulation represents a valuable attempt to move from prediction to decision support.</p>
            <p> However, several aspects require further development to ensure scientific robustness.</p>
            <p> First, the methodological description is insufficiently detailed. Key elements of the LSTM model&#x2014;such as architecture, hyperparameters, training procedure, and validation strategy&#x2014;are not fully specified, which limits reproducibility.</p>
            <p> Second, the modeling framework is relatively limited. The comparison is restricted to ARIMA and a na&#x00ef;ve baseline, whereas the current literature supports the use of more advanced and hybrid approaches. For example, recent work combining econometric and machine learning models in a counterfactual framework has demonstrated improved robustness, interpretability, and policy relevance (refer 1).</p>
            <p> Third, the policy simulation approach relies on simplified assumptions, particularly the linear relationship between prevalence reduction and DALYs. This assumption may not adequately capture real-world nonlinearities or cross-country heterogeneity, and therefore the policy conclusions should be interpreted with caution.</p>
            <p> Fourth, the statistical evaluation could be strengthened. The study relies primarily on MAE, while additional metrics (e.g., RMSE, MAPE) and robustness checks would provide a more comprehensive assessment of model performance.</p>
            <p> Fifth, although the discussion is generally appropriate, some conclusions are stated too strongly given the limitations of the modeling approach. In particular, the manuscript does not clearly distinguish between predictive simulation and causal inference, which may lead to overinterpretation of policy effects.</p>
            <p> Finally, the manuscript would benefit from stronger engagement with recent literature on counterfactual modeling and hybrid forecasting approaches in public health, which provide more robust frameworks for evaluating policy impacts.</p>
            <p> In conclusion, this is a promising and relevant contribution with practical value, but it requires 
                <bold>major revisions</bold> to improve methodological transparency, strengthen the analytical framework, and moderate the interpretation of results.</p>
            <p>Is the work clearly and accurately presented and does it cite the current literature?</p>
            <p>Partly</p>
            <p>If applicable, is the statistical analysis and its interpretation appropriate?</p>
            <p>Partly</p>
            <p>Are all the source data underlying the results available to ensure full reproducibility?</p>
            <p>Yes</p>
            <p>Is the study design appropriate and is the work technically sound?</p>
            <p>Partly</p>
            <p>Are the conclusions drawn adequately supported by the results?</p>
            <p>Partly</p>
            <p>Are sufficient details of methods and analysis provided to allow replication by others?</p>
            <p>Partly</p>
            <p>Reviewer Expertise:</p>
            <p>Public health analytics, time-series econometrics, machine learning applications in health, and policy evaluation. I am particularly familiar with forecasting methods, counterfactual analysis, and the assessment of public health interventions using statistical and hybrid ML approaches.</p>
            <p>I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard, however I have significant reservations, as outlined above.</p>
        </body>
        <back>
            <ref-list>
                <title>References</title>
                <ref id="rep-ref-475280-1">
                    <label>1</label>
                    <mixed-citation publication-type="journal">
                        <person-group person-group-type="author"/>:
                        <article-title>The long-term impact of Spain's 2010 Anti-Smoking Law: A counterfactual and prospective time-series analysis</article-title>.
                        <source>
                            <italic>AIMS Public Health</italic>
                        </source>.<year>2026</year>;<volume>13</volume>(<issue>1</issue>) :
                        <elocation-id>10.3934/publichealth.2026011</elocation-id>
                        <fpage>178</fpage>-<lpage>203</lpage>
                        <pub-id pub-id-type="doi">10.3934/publichealth.2026011</pub-id>
                    </mixed-citation>
                </ref>
            </ref-list>
        </back>
    </sub-article>
</article>
