<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.2 20190208//EN" "http://jats.nlm.nih.gov/publishing/1.2/JATS-journalpublishing1.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="1.2" xml:lang="en">
    <front>
        <journal-meta>
            <journal-id journal-id-type="pmc">F1000Research</journal-id>
            <journal-title-group>
                <journal-title>F1000Research</journal-title>
            </journal-title-group>
            <issn pub-type="epub">2046-1402</issn>
            <publisher>
                <publisher-name>F1000 Research Limited</publisher-name>
                <publisher-loc>London, UK</publisher-loc>
            </publisher>
        </journal-meta>
        <article-meta>
            <article-id pub-id-type="doi">10.12688/f1000research.54449.2</article-id>
            <article-categories>
                <subj-group subj-group-type="heading">
                    <subject>Research Article</subject>
                </subj-group>
                <subj-group>
                    <subject>Articles</subject>
                </subj-group>
            </article-categories>
            <title-group>
                <article-title>Philympics 2021: Prophage Predictions Perplex Programs</article-title>
                <fn-group content-type="pub-status">
                    <fn>
                        <p>[version 2; peer review: 1 approved, 1 approved with reservations]</p>
                    </fn>
                </fn-group>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author" corresp="yes">
                    <name>
                        <surname>Roach</surname>
                        <given-names>Michael J.</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Data Curation</role>
                    <role content-type="http://credit.niso.org/">Formal Analysis</role>
                    <role content-type="http://credit.niso.org/">Investigation</role>
                    <role content-type="http://credit.niso.org/">Methodology</role>
                    <role content-type="http://credit.niso.org/">Software</role>
                    <role content-type="http://credit.niso.org/">Validation</role>
                    <role content-type="http://credit.niso.org/">Visualization</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Original Draft Preparation</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <uri content-type="orcid">https://orcid.org/0000-0003-1488-5148</uri>
                    <xref ref-type="corresp" rid="c1">a</xref>
                    <xref ref-type="aff" rid="a1">1</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>McNair</surname>
                        <given-names>Katelyn</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Data Curation</role>
                    <role content-type="http://credit.niso.org/">Investigation</role>
                    <role content-type="http://credit.niso.org/">Methodology</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <xref ref-type="aff" rid="a2">2</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Michalczyk</surname>
                        <given-names>Maciej</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Investigation</role>
                    <role content-type="http://credit.niso.org/">Software</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <uri content-type="orcid">https://orcid.org/0000-0002-7696-1663</uri>
                    <xref ref-type="aff" rid="a3">3</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Giles</surname>
                        <given-names>Sarah K</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Data Curation</role>
                    <role content-type="http://credit.niso.org/">Investigation</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <xref ref-type="aff" rid="a1">1</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Inglis</surname>
                        <given-names>Laura K</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Data Curation</role>
                    <role content-type="http://credit.niso.org/">Investigation</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <xref ref-type="aff" rid="a1">1</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Pargin</surname>
                        <given-names>Evan</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Data Curation</role>
                    <role content-type="http://credit.niso.org/">Investigation</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <xref ref-type="aff" rid="a1">1</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Barylski</surname>
                        <given-names>Jakub</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Investigation</role>
                    <role content-type="http://credit.niso.org/">Software</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <xref ref-type="aff" rid="a3">3</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Roux</surname>
                        <given-names>Simon</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Investigation</role>
                    <role content-type="http://credit.niso.org/">Software</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <xref ref-type="aff" rid="a4">4</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Decewicz</surname>
                        <given-names>Przemys&#x0142;aw</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Data Curation</role>
                    <role content-type="http://credit.niso.org/">Investigation</role>
                    <role content-type="http://credit.niso.org/">Methodology</role>
                    <role content-type="http://credit.niso.org/">Resources</role>
                    <role content-type="http://credit.niso.org/">Software</role>
                    <role content-type="http://credit.niso.org/">Supervision</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <xref ref-type="aff" rid="a5">5</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Edwards</surname>
                        <given-names>Robert A.</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Conceptualization</role>
                    <role content-type="http://credit.niso.org/">Data Curation</role>
                    <role content-type="http://credit.niso.org/">Formal Analysis</role>
                    <role content-type="http://credit.niso.org/">Funding Acquisition</role>
                    <role content-type="http://credit.niso.org/">Methodology</role>
                    <role content-type="http://credit.niso.org/">Project Administration</role>
                    <role content-type="http://credit.niso.org/">Resources</role>
                    <role content-type="http://credit.niso.org/">Software</role>
                    <role content-type="http://credit.niso.org/">Supervision</role>
                    <role content-type="http://credit.niso.org/">Visualization</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Original Draft Preparation</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <xref ref-type="aff" rid="a1">1</xref>
                </contrib>
                <aff id="a1">
                    <label>1</label>Flinders Accelerator for Microbiome Exploration, Flinders University, Adelaide, SA, 5042, Australia</aff>
                <aff id="a2">
                    <label>2</label>Computational Sciences Research Center, San Diego State University, San Diego, CA, 92182, USA</aff>
                <aff id="a3">
                    <label>3</label>Department of Molecular Virology, Institute of Experimental Biology, Faculty of Biology, Adam Mickiewicz University, 61-64 Poznan, Poland</aff>
                <aff id="a4">
                    <label>4</label>DOE Joint Genome Institute, Lawrence Berkeley National Laboratory, Berkeley, CA, 94720, USA</aff>
                <aff id="a5">
                    <label>5</label>Department of Environmental Microbiology and Biotechnology, Institute of Microbiology, Faculty of Biology, University of Warsaw, Warsaw, 02-096, Poland</aff>
            </contrib-group>
            <author-notes>
                <corresp id="c1">
                    <label>a</label>
                    <email xlink:href="mailto:michael.roach@flinders.edu.au">michael.roach@flinders.edu.au</email>
                </corresp>
                <fn fn-type="conflict">
                    <p>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>8</day>
                <month>4</month>
                <year>2022</year>
            </pub-date>
            <pub-date pub-type="collection">
                <year>2021</year>
            </pub-date>
            <volume>10</volume>
            <elocation-id>758</elocation-id>
            <history>
                <date date-type="accepted">
                    <day>5</day>
                    <month>4</month>
                    <year>2022</year>
                </date>
            </history>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2022 Roach MJ et al.</copyright-statement>
                <copyright-year>2022</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access article distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <self-uri content-type="pdf" xlink:href="https://f1000research.com/articles/10-758/pdf"/>
            <abstract>
                <p>Background</p>
                <p> Most bacterial genomes contain integrated bacteriophages&#x2014;prophages&#x2014;in various states of decay. Many are active and able to excise from the genome and replicate, while others are cryptic prophages, remnants of their former selves. Over the last two decades, many computational tools have been developed to identify the prophage components of bacterial genomes, and it is a particularly active area for the application of machine learning approaches. However, progress is hindered and comparisons thwarted because there are no manually curated bacterial genomes that can be used to test new prophage prediction algorithms.</p>
                <p> Methods</p>
                <p> We present a library of gold-standard bacterial genome annotations that include manually curated prophage annotations, and a computational framework to compare the predictions from different algorithms. We use this suite to compare all extant stand-alone prophage prediction algorithms to identify their strengths and weaknesses. We provide a FAIR dataset for prophage identification, and demonstrate the accuracy, precision, recall, and f
                    <sub>1</sub> score from the analysis of seven different algorithms for the prediction of prophages.</p>
                <p> Results</p>
                <p> We identified different strengths and weaknesses between the prophage prediction tools. Several tools exhibit exceptional f
                    <sub>1</sub> scores, while others have better recall at the expense of more false positives. The tools vary greatly in runtime performance with few exhibiting all desirable qualities for large-scale analyses.</p>
                <p> Conclusions</p>
                <p> Our library of gold-standard prophage annotations and benchmarking framework provide a valuable resource for exploring strengths and weaknesses of current and future prophage annotation tools. We discuss caveats and concerns in this analysis, how those concerns may be mitigated, and avenues for future improvements. This framework will help developers identify opportunities for improvement and test updates. It will also help users in determining the tools that are best suited for their analysis.</p>
            </abstract>
            <kwd-group kwd-group-type="author">
                <kwd>software comparison</kwd>
                <kwd>bioinformatics tool</kwd>
                <kwd>lysogen genome</kwd>
                <kwd>temperate phage</kwd>
                <kwd>prokaryotic virus</kwd>
            </kwd-group>
            <funding-group>
                <award-group id="fund-1">
                    <funding-source>NIH National Institute Of Diabetes And Digestive And Kidney Diseases</funding-source>
                    <award-id>RC2DK116713</award-id>
                </award-group>
                <funding-statement>This work supported by the National Institute Of Diabetes And Digestive And Kidney Diseases of the National Institutes of Health under Award Number RC2DK116713 to RAE. The support provided by Flinders University for HPC research resources is acknowledged.</funding-statement>
                <funding-statement>
                    <italic>The funders had no role in study design, data collection and analysis, decision to publish, or preparation of the manuscript.</italic>
                </funding-statement>
            </funding-group>
        </article-meta>
        <notes>
            <sec sec-type="version-changes">
                <label>Revised</label>
                <title>Amendments from Version 1</title>
                <p>In this version we address the comments of the reviewers. The comparison now includes two additional programs (ProphET and Seeker), and an additional 29 manually-curated genomes to the gold-standard library; we have updated the results accordingly. We compare f1 scores of the different genera that are present in the gold-standard library to assess how the performance of the programs may be influenced by taxonomy. The underlying data now includes our guidelines for manually curating genomes with prophage annotations.</p>
            </sec>
        </notes>
    </front>
    <body>
        <sec id="sec1" sec-type="intro">
            <title>Introduction</title>
            <p>Bacteriophages (phages), viruses that infect bacteria, can be either temperate or virulent. Temperate phages may integrate into their bacterial host genome. Such integrated phage genomes are referred to as prophages and may constitute as much as 20 percent of bacterial DNA (
                <xref ref-type="bibr" rid="ref10">Casjens, 2003</xref>). They replicate as part of the host genomes until external conditions trigger a transition into the virulent lytic cycle, resulting in replication and packaging of phages and typically the death of the host bacteria. Prophages generally contain a set of core genes with a conserved gene order that facilitate integration into the host genome, assembly of phage structural components, replication, and lysis of the host cell (
                <xref ref-type="bibr" rid="ref20">Kang et al., 2017</xref>; 
                <xref ref-type="bibr" rid="ref9">Canchaya et al., 2003</xref>). As well as these core genes, phages can contain an array of accessory metabolic genes that can effect significant phenotypic changes in the host bacteria (
                <xref ref-type="bibr" rid="ref5">Breitbart, 2012</xref>). For instance, many prophages encode virulence factors such as toxins, or fitness factors such as nutrient uptake systems (
                <xref ref-type="bibr" rid="ref6">Br&#x00fc;ssow et al., 2004</xref>). Lastly, many prophages encode a variety of super-infection exclusion mechanisms to prevent concurrent phage infections, including restriction/modification systems, toxin/antitoxin genes, repressors, etc. reviewed in 
                <xref ref-type="bibr" rid="ref39">Abedon (2015</xref>, 
                <xref ref-type="bibr" rid="re40">2019)</xref>. The function of most prophage accessory genes remains unknown.</p>
            <p>Core (pro) phage genes have long been used for identifying prophage regions. However, there are other unique characteristics that can distinguish prophages from their host genomes: bacterial genomes have a GC skew that correlates with the direction of replication, and the insertion of prophages will generally disrupt this GC bias (
                <xref ref-type="bibr" rid="ref16">Grigoriev, 1998</xref>). Transcript direction (
                <xref ref-type="bibr" rid="ref8">Campbell, 2002</xref>) and length of prophage proteins have also proven to be useful metrics in predicting prophages (
                <xref ref-type="bibr" rid="ref1">Akhter et al., 2012</xref>; 
                <xref ref-type="bibr" rid="ref35">Song et al., 2019</xref>), where phage genes are generally smaller and are oriented in the same direction (
                <xref ref-type="bibr" rid="ref11">Dutilh et al., 2014</xref>). Likewise, gene density tends to be higher in phage genomes and intergenic space shorter (
                <xref ref-type="bibr" rid="ref2">Amgarten et al., 2018</xref>; 
                <xref ref-type="bibr" rid="ref25">McNair et al., 2019</xref>).</p>
            <p>Over the last two decades many prophage prediction tools have been developed, and they fall into two broad classes: (1) web-based tools where users upload a bacterial genome and retrieve prophage annotations including 
                <ext-link ext-link-type="uri" xlink:href="https://phaster.ca/">PHASTER</ext-link> (
                <xref ref-type="bibr" rid="ref3">Arndt et al., 2016</xref>), 
                <ext-link ext-link-type="uri" xlink:href="https://pro-hunter.genomics.cn/">Prophage Hunter</ext-link> (
                <xref ref-type="bibr" rid="ref35">Song et al., 2019</xref>), 
                <ext-link ext-link-type="uri" xlink:href="http://aclame.ulb.ac.be/Tools/Prophinder/">Prophinder</ext-link> (
                <xref ref-type="bibr" rid="ref24">Lima-Mendez et al., 2008</xref>), 
                <ext-link ext-link-type="uri" xlink:href="http://computationalbiology.ufpa.br/phageweb/">PhageWeb</ext-link> (
                <xref ref-type="bibr" rid="ref36">Sousa et al., 2018</xref>), and 
                <ext-link ext-link-type="uri" xlink:href="https://rast.nmpdr.org/">RAST</ext-link> (
                <xref ref-type="bibr" rid="ref4">Aziz et al., 2008</xref>); and (2) command-line tools where users download a program and database to run the predictions locally (although some of these also provide a web interface for remote execution). In this work we focus on this latter set of tools (
                <xref ref-type="table" rid="T1">Table 1</xref>) because web-based tools typically do not handle the large numbers of simultaneous requests required to run comparisons across many genomes.</p>
            <table-wrap id="T1" orientation="portrait" position="float">
                <label>Table 1. </label>
                <caption>
                    <title>Prophage identification tools currently included in benchmarking framework.</title>
                </caption>
                <table content-type="article-table" frame="hsides">
                    <thead>
                        <tr>
                            <th align="left" colspan="1" rowspan="1" valign="top">Tool (year)</th>
                            <th align="left" colspan="1" rowspan="1" valign="top">Version</th>
                            <th align="left" colspan="1" rowspan="1" valign="top">Package manager</th>
                            <th align="left" colspan="1" rowspan="1" valign="top">Dependencies</th>
                            <th align="left" colspan="1" rowspan="1" valign="top">Database size</th>
                            <th align="left" colspan="1" rowspan="1" valign="top">Approach</th>
                            <th align="left" colspan="1" rowspan="1" valign="top">Citation</th>
                        </tr>
                    </thead>
                    <tbody>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">Phage Finder (2006)</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">2.1</td>
                            <td colspan="1" rowspan="1"/>
                            <td align="left" colspan="1" rowspan="1" valign="top">Aragorn, BLAST-legacy, HMMer, Infernal, MUMmer, tRNAscan-SE</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">93 MB</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Legacy-BLAST, HMMs</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">(
                                <xref ref-type="bibr" rid="ref12">Fouts, 2006</xref>)</td>
                        </tr>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">PhiSpy (2012)</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">4.2.6</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">conda, pip</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Python3, BioPython, NumPy, SciPy</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">47 MB required, 733 MB optional (pVOGs)</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Gene and nucleotide metrics, AT/CG skew, kmer comparison, machine learning, HMMs, annotation keywords</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">(
                                <xref ref-type="bibr" rid="ref1">Akhter et al., 2012</xref>)</td>
                        </tr>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">VirSorter (2015)</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">1.0.6</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">conda</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">MCL, Muscle, BLAST+, BioPerl, HMMer, Diamond, Metagene_annotator</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">13 GB</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Alignments, HMMs</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">(
                                <xref ref-type="bibr" rid="ref32">Roux et al., 2015</xref>)</td>
                        </tr>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">ProphET (2019)</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">0.5.1</td>
                            <td colspan="1" rowspan="1"/>
                            <td align="left" colspan="1" rowspan="1" valign="top">BLAST-legacy, EMBOSS, BedTools, Perl, BioPerl</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">41 Mb</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Legacy-BLAST searches</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">(
                                <xref ref-type="bibr" rid="ref29">Reis-Cunha et al., 2019</xref>)</td>
                        </tr>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">Phigaro (2020)</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">2.3.0</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">conda, pip</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Python3, Beautifulsoup4, BioPython, bs4, HMMer, lxml, NumPy, Pandas, Plotly, Prodigal, PyYAML, shsix</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">1.6 GB</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">HMMs</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">(
                                <xref ref-type="bibr" rid="ref37">Starikova et al., 2020</xref>)</td>
                        </tr>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">DBSCAN-SWA (2020)</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">2e61b95</td>
                            <td colspan="1" rowspan="1"/>
                            <td align="left" colspan="1" rowspan="1" valign="top">Numpy, BioPython, Scikit-learn, Prokka</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">2.2 GB</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Gene metrics, alignments</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">(
                                <xref ref-type="bibr" rid="ref13">Gan et al., 2020</xref>)</td>
                        </tr>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">VIBRANT (2020)</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">1.2.1</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">conda</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Python3, Prodigal, HMMer, BioPython, Pandas, Matplotlib, Seaborn, Numpy, Scikit-learn, Pickle</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">11 GB</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">HMMs (KEGG, Pfam, VOG), machine learning</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">(
                                <xref ref-type="bibr" rid="ref22">Kieft et al., 2020</xref>)</td>
                        </tr>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">Seeker (2020)</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">1.0.3</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">pip</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Python3, TensorFlow</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">64 kb</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Machine learning (LSTM)</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">(Auslander et al., 2020)</td>
                        </tr>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">PhageBoost (2021)</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">0.1.7</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">pip</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Python3</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">13 MB</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Gene and nucleotide metrics, machine learning</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">(
                                <xref ref-type="bibr" rid="ref34">Sir&#x00e9;n et al., 2021</xref>)</td>
                        </tr>
                        <tr>
                            <td align="left" colspan="1" rowspan="1" valign="top">VirSorter2 (2021)</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">2.2.1</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">conda</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Python3, Snakemake, Scikit-learn, imbalanced-learn, Pandas, Seaborn, HMMer, Prodigal, screed</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">12 GB</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">Alignments, HMMs</td>
                            <td align="left" colspan="1" rowspan="1" valign="top">(
                                <xref ref-type="bibr" rid="ref18">Guo et al., 2021</xref>)</td>
                        </tr>
                    </tbody>
                </table>
            </table-wrap>
            <p>Despite the abundance of prophage prediction algorithms, there has never been either a set of reference genomes against which all tools can be compared, nor a unified framework for comparing those tools to identify their relative strengths and weaknesses or to identify opportunities for improvement. We generated a set of manually annotated bacterial genomes released under the FAIR principles (Findable, Accessible, Interoperable, and Reusable), and developed an openly available and accessible framework to compare prophage prediction tools.</p>
        </sec>
        <sec id="sec2" sec-type="methods">
            <title>Methods</title>
            <sec id="sec3">
                <title>Running the tools</title>
                <p>To assess the accuracy of the different prophage prediction tools, a set of 57 gold-standard publicly available bacterial genomes with manually curated prophage annotations was generated. We combined this with the 21 manually annotated genomes described in 
                    <xref ref-type="bibr" rid="ref10">Casjens (2003)</xref> that were not already included for a total of 78 genomes for evaluating the bioinformatics tools. The genomes and prophage annotations currently included are available in Table S1. The genomes are in GenBank format and file conversion scripts are included in the framework to convert those files to formats used by the different software. The tools that are currently included in the framework are outlined in 
                    <xref ref-type="table" rid="T1">Table 1</xref>. Snakemake (
                    <xref ref-type="bibr" rid="ref23">K&#x00f6;ster &amp; Rahmann, 2012</xref>) pipelines utilising conda (Anaconda Software Distribution. 
                    <italic toggle="yes">Conda.</italic> v4.10.1, April 2021 (
                    <ext-link ext-link-type="uri" xlink:href="https://docs.conda.io/en/latest/">Conda</ext-link>, RRID:SCR_018317)) package manager environments were created for each tool to handle the installation of the tool and its dependencies, running of the analyses, output file conversion to a standardized format, and benchmarking of the run stage. Where possible, gene annotations from the GenBank files were used in the analysis to promote consistency between comparisons. DBSCAN-SWA was not able to consistently finish when using GenBank files as input, and instead the genome files in fasta format were used. Another pipeline was created to pool the results from each tool and some comparisons are illustrated in the included Jupyter notebook. Testing and development of the pipelines were conducted on Flinders University&#x2019;s DeepThought HPC infrastructure. The final benchmarking analysis was performed on a stand-alone node consisting of dual Intel&#x00ae; Xeon&#x00ae; Gold 6242R processors (40 cores, 80 threads), 768 GB of RAM, and 58 TB of disk space. Each tool was executed on all genomes in parallel (one thread per job), with no other jobs running. The only exception to this was Seeker which was run one at a time on a single core due to high memory requirements (see below).</p>
                <boxed-text id="B1" orientation="portrait" position="anchor">
                    <label>Box 1. </label>
                    <caption>
                        <title>Benchmark metrics used in this analysis.</title>
                    </caption>
                    <p>
                        <table-wrap id="T100" orientation="portrait" position="anchor">
                            <table content-type="article-table" frame="hsides">
                                <tbody>
                                    <tr>
                                        <td align="left" colspan="1" rowspan="1" valign="top">Accuracy was calculated as the ratio of correctly labelled genes to all CDS features from the GenBank file</td>
                                        <td align="left" colspan="1" rowspan="1" valign="top">
                                            <inline-formula>
                                                <mml:math display="inline">
                                                    <mml:mfrac>
                                                        <mml:mrow>
                                                            <mml:mi mathvariant="italic">TP</mml:mi>
                                                            <mml:mo>+</mml:mo>
                                                            <mml:mi mathvariant="italic">TN</mml:mi>
                                                        </mml:mrow>
                                                        <mml:mrow>
                                                            <mml:mi mathvariant="italic">TP</mml:mi>
                                                            <mml:mo>+</mml:mo>
                                                            <mml:mi mathvariant="italic">TN</mml:mi>
                                                            <mml:mo>+</mml:mo>
                                                            <mml:mi mathvariant="italic">FP</mml:mi>
                                                            <mml:mo>+</mml:mo>
                                                            <mml:mi mathvariant="italic">FN</mml:mi>
                                                        </mml:mrow>
                                                    </mml:mfrac>
                                                </mml:math>
                                            </inline-formula>
                                        </td>
                                    </tr>
                                    <tr>
                                        <td align="left" colspan="1" rowspan="1" valign="top">Precision was calculated as the ratio of correctly labelled phage CDS features to all predicted prophage CDS features</td>
                                        <td align="left" colspan="1" rowspan="1" valign="top">
                                            <inline-formula>
                                                <mml:math display="inline">
                                                    <mml:mfrac>
                                                        <mml:mi mathvariant="italic">TP</mml:mi>
                                                        <mml:mrow>
                                                            <mml:mi mathvariant="italic">TP</mml:mi>
                                                            <mml:mo>+</mml:mo>
                                                            <mml:mi mathvariant="italic">FP</mml:mi>
                                                        </mml:mrow>
                                                    </mml:mfrac>
                                                </mml:math>
                                            </inline-formula>
                                        </td>
                                    </tr>
                                    <tr>
                                        <td align="left" colspan="1" rowspan="1" valign="top">Recall was calculated as the ratio of correctly labelled prophage CDS features to all known prophage CDS features</td>
                                        <td align="left" colspan="1" rowspan="1" valign="top">
                                            <inline-formula>
                                                <mml:math display="inline">
                                                    <mml:mfrac>
                                                        <mml:mi mathvariant="italic">TP</mml:mi>
                                                        <mml:mrow>
                                                            <mml:mi mathvariant="italic">TP</mml:mi>
                                                            <mml:mo>+</mml:mo>
                                                            <mml:mi mathvariant="italic">FN</mml:mi>
                                                        </mml:mrow>
                                                    </mml:mfrac>
                                                </mml:math>
                                            </inline-formula>
                                        </td>
                                    </tr>
                                    <tr>
                                        <td align="left" colspan="1" rowspan="1" valign="top">The f
                                            <sub>1</sub> Score was calculated as the harmonic mean of Precision and Recall</td>
                                        <td align="left" colspan="1" rowspan="1" valign="top">
                                            <inline-formula>
                                                <mml:math display="inline">
                                                    <mml:mn>2</mml:mn>
                                                    <mml:mo>&#x00d7;</mml:mo>
                                                    <mml:mfrac>
                                                        <mml:mfenced close=")" open="(">
                                                            <mml:mrow>
                                                                <mml:mtext mathvariant="italic">Recall</mml:mtext>
                                                                <mml:mo>&#x00d7;</mml:mo>
                                                                <mml:mtext mathvariant="italic">Precision</mml:mtext>
                                                            </mml:mrow>
                                                        </mml:mfenced>
                                                        <mml:mfenced close=")" open="(">
                                                            <mml:mrow>
                                                                <mml:mtext mathvariant="italic">Recall</mml:mtext>
                                                                <mml:mo>+</mml:mo>
                                                                <mml:mtext mathvariant="italic">Precision</mml:mtext>
                                                            </mml:mrow>
                                                        </mml:mfenced>
                                                    </mml:mfrac>
                                                </mml:math>
                                            </inline-formula>
                                        </td>
                                    </tr>
                                    <tr>
                                        <td colspan="2" rowspan="1">
                                            <italic toggle="yes">Accuracy</italic> provides an overall impression of correctness but is distorted by the vast difference in the numbers of prophage and non-prophage CDS features present in the genomes. The current gold-standard set includes 7,729 prophage proteins and 177,649 non-prophage proteins. Therefore, predicting everything as not coming from a prophage will result in an accuracy of 0.96. Similarly, identifying everything as coming from a prophage will result in high 
                                            <italic toggle="yes">Recall</italic>, since that favours minimising false negatives. In contrast, 
                                            <italic toggle="yes">Precision</italic> favours minimising false-positives and so only predicting very confident regions will result in high precision. The f
                                            <sub>1</sub> Score is the most suitable for comparing predictions as it gives equal weighting to both precision and recall, and thus balances the unevenness inherent in this data.</td>
                                    </tr>
                                </tbody>
                            </table>
                        </table-wrap>
                    </p>
                </boxed-text>
            </sec>
            <sec id="sec4">
                <title>Benchmark metrics</title>
                <p>The runtime and CPU time in seconds, peak memory usage and file write operations were captured by Snakemake (
                    <ext-link ext-link-type="uri" xlink:href="https://bitbucket.org/johanneskoester/snakemake/wiki/">Snakemake</ext-link>, RRID:SCR_003475) for the steps running the prophage tools only (not for any file conversion steps before or after running each tool). The predictions were compared to the gold standard prophage annotations and the number of true positive (TP), true negative (TN), false positive (FP) and false negative (FN) gene labels were used to calculate the performance metrics. Each application marks prophages slightly differently, and therefore we used the designation of coding sequence (CDS) features as phage or not to assess prophage predictions.</p>
            </sec>
            <sec id="sec5">
                <title>Adding new genomes</title>
                <p>We developed the framework to simplify the addition of new genomes to the benchmarks. Each genome is provided in the standard GenBank format, and the prophages are marked by the inclusion of a non-standard flag for each genomic feature that indicates that it is part of a prophage. We use the qualifier
                    <italic toggle="yes">/is_phage=&#x201c;1&#x201d;</italic> to indicate prophage regions. Our guidelines for manually annotating prophages in bacterial genomes are available in the GitHub repository at 
                    <ext-link ext-link-type="uri" xlink:href="https://github.com/linsalrob/ProphagePredictionComparisons/blob/master/Supplementary/prophageAnnotation.md">github.com/linsalrob/ProphagePredictionComparisons/blob/master/Supplementary/prophageAnnotation.md</ext-link>.</p>
            </sec>
        </sec>
        <sec id="sec6" sec-type="results|discussion">
            <title>Results and discussion</title>
            <sec id="sec7">
                <title>Software compared</title>
                <p>We compared the availability, installation, and results from ten different prophage prediction algorithms (
                    <xref ref-type="table" rid="T1">Table 1</xref>). LysoPhD (
                    <xref ref-type="bibr" rid="ref27">Niu et al., 2019</xref>) could not be successfully installed and was not included in the current framework (see below). The remaining ten&#x2014;PhiSpy (
                    <xref ref-type="bibr" rid="ref1">Akhter et al., 2012</xref>), Phage Finder (
                    <xref ref-type="bibr" rid="ref12">Fouts, 2006</xref>), VIBRANT (
                    <xref ref-type="bibr" rid="ref22">Kieft et al., 2020</xref>), VirSorter (
                    <xref ref-type="bibr" rid="ref32">Roux et al., 2015</xref>), Virsorter2 (
                    <xref ref-type="bibr" rid="ref18">Guo et al., 2021</xref>), Phigaro (
                    <xref ref-type="bibr" rid="ref37">Starikova et al., 2020</xref>), PhageBoost (
                    <xref ref-type="bibr" rid="ref34">Sir&#x00e9;n et al., 2021</xref>), DBSCAN-SWA (
                    <xref ref-type="bibr" rid="ref13">Gan et al., 2020</xref>), ProphET (
                    <xref ref-type="bibr" rid="ref29">Reis-Cunha et al., 2019</xref>), and Seeker (Auslander et al., 2020)&#x2014;were each used to predict the prophages in 78 different manually curated microbial genomes.</p>
                <p>Most of these programs utilize protein sequence similarity and HMM searches of core prophage genes to identify prophage regions. PhageBoost leverages a large range of protein features (such as dipeptide and tripeptide combinations) with a trained prediction model. PhiSpy was originally designed to identify prophage regions based upon seven distinct characteristics: protein length, transcript directionality, AT and GC skew, unique phage words, phage insertion points, optionally phage protein similarity and sequence similarity. DBSCAN-SWA likewise uses a range of gene metrics and trained prediction models to identify prophages. Seeker uses a new neural network model applied to bacterial and phage reference genome sequences to classify sequences as phage or bacteria. It was intended for use with sort sequences but can be used to identify prophages.</p>
                <p>Regardless of whether gene annotations are available, Virsorter2, Phigaro, PhageBoost, and ProphET all perform 
                    <italic toggle="yes">de novo</italic> gene prediction with Prodigal (
                    <xref ref-type="bibr" rid="ref19">Hyatt et al., 2010</xref>) and VirSorter uses MetaGeneAnnotator (
                    <xref ref-type="bibr" rid="ref28">Noguchi et al., 2008</xref>) for the same purpose. VIBRANT can take proteins if they have &#x2018;Prodigal format definition lines&#x2019; but otherwise performs predictions with Prodigal. PhageBoost can take existing gene annotations but this requires additional coding by the user. DBSCAN-SWA can take gene annotations or can perform gene predictions with Prokka (
                    <xref ref-type="bibr" rid="ref33">Seemann, 2014</xref>). PhiSpy takes an annotated genome in GenBank format and uses the gene annotations provided.</p>
            </sec>
            <sec id="sec8">
                <title>Ease of installation</title>
                <p>The prophage prediction packages Phigaro, PhiSpy, VIBRANT, VirSorter, and VirSorter2 are all able to be installed with conda from the Bioconda channel (
                    <xref ref-type="bibr" rid="ref17">Gr&#x00fc;ning et al., 2018</xref>), while Phispy, Phigaro, PhageBoost, and Seeker can be installed with pip&#x2014;the Python package installer. Phigaro, VIBRANT, VirSorter, and VirSorter2 require a manual one-time setup to download their respective databases. Phigaro uses hard-coded file paths for its database installation, either to the user&#x2019;s home directory or to a system directory requiring root permissions. Neither option is ideal as it is impossible to have isolated versions or installations of the program, and it prevents updating the installation paths of its dependencies. For PhageBoost to be able to take existing gene annotations, a custom script was created to skip the gene prediction stage and run the program. Basic PhiSpy functionality is provided without requiring third-party databases. However, if the HMM search option is invoked, a database of phage-like proteins&#x2014;e.g. pVOG (
                    <xref ref-type="bibr" rid="ref15">Grazziotin et al., 2017</xref>), VOGdb (
                    <ext-link ext-link-type="uri" xlink:href="https://vogdb.org">https://vogdb.org</ext-link>), or PHROGS (
                    <xref ref-type="bibr" rid="ref38">Terzian P et al., 2021</xref>)&#x2014;must be manually downloaded before it can be included in PhiSpy predictions. DBSCAN-SWA is not currently available on any package manager and must be pulled from GitHub, however all its dependencies are available via conda and it could easily be added in the future. All the above &#x201c;manual&#x201d; installation and setup steps are uncomplicated and are automatically executed by the Snakemake pipelines provided in the framework.</p>
                <p>Phage Finder was last updated in 2006 and is not available on any package manager that we are aware of. The installation process is dated with the package scripts liberally utilising hard-coded file paths. The Snakemake pipeline for this package resolves this with soft links between the framework&#x2019;s directory to the user&#x2019;s home directory (where the package expects to be installed). The dependencies are available via conda allowing the complete installation and setup to be handled automatically by Snakemake.</p>
                <p>Installing and running ProphET is a non-trivial task. It requires the unsupported BLAST legacy and EMBOSS packages and a set of Perl libraries, including a custom library for preparing the necessary GFF files for running the program. The dependencies are mostly available via Conda and the remaining required files are included in this repository. LysoPhD does not appear to be available to download anywhere and was dropped from the comparison.</p>
            </sec>
            <sec id="sec9">
                <title>Prophage prediction performance</title>
                <p>There are many potential ways to compare prophage predictions. For instance, is it more important to capture all prophage regions or minimise false positives? Is it more important to identify all the phage-encoded genes, or the exact locations of the attachment site core duplications (
                    <italic toggle="yes">attL</italic> and 
                    <italic toggle="yes">attR</italic>)? We explore several metrics to highlight the different strengths of each prophage prediction tool. PhiSpy, VIBRANT, Phigaro, and ProphET performed best for mean accuracy (
                    <xref ref-type="fig" rid="f1">Figure 1a</xref>; 
                    <xref ref-type="table" rid="T3">Table 2</xref>) while Seeker and DBSCAN-SWA performed the worst. PhiSpy, Phigaro, Phage Finder, VIBRANT, and ProphET performed best for mean precision (
                    <xref ref-type="fig" rid="f1">Figure 1b</xref>; 
                    <xref ref-type="table" rid="T3">Table 2</xref>). Seeker, DBSCAN-SWA, PhageBoost, VirSorter, and VirSorter2 all performed poorly for mean precision. This was mostly driven by a high false-positive rate compared to the other tools (Figure S1). VirSorter, VirSorter2, VIBRANT, PhiSpy, DBSCAN-SWA, and PhageBoost all had high mean recall scores.</p>
                <fig fig-type="figure" id="f1" orientation="portrait" position="float">
                    <label>Figure 1. </label>
                    <caption>
                        <title>Prediction performance metrics for prophage callers.</title>
                        <p>Violin plots for each tool are shown with individual points for each genome indicated. The graphs show: &#x2018;Accuracy&#x2019; (
                            <italic toggle="yes">a</italic>) as the ratio of correctly labelled genes to all genes, &#x2018;Precision&#x2019; (
                            <italic toggle="yes">b</italic>) as the ratio of correctly labelled phage genes to all predicted phage genes, &#x2018;Recall&#x2019; (
                            <italic toggle="yes">c</italic>) as the ratio of correctly labelled phage genes to all known phage genes, and &#x2018;f
                            <sub>1</sub> Score&#x2019; (
                            <italic toggle="yes">d</italic>) as defined in the methods. For all graphs, more is generally better.</p>
                    </caption>
                    <graphic id="gr1" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/124379/ca54a636-ce96-434b-a31b-eaefc246350d_figure1.gif"/>
                </fig>
                <table-wrap id="T3" orientation="portrait" position="float">
                    <label>Table 2. </label>
                    <caption>
                        <title>Mean metrics for each tool as measured from our gold-standard set of genomes.</title>
                    </caption>
                    <table content-type="article-table" frame="hsides">
                        <thead>
                            <tr>
                                <th align="left" colspan="1" rowspan="2" valign="bottom">Tool</th>
                                <th align="left" colspan="2" rowspan="1" valign="top">Accuracy</th>
                                <th align="left" colspan="2" rowspan="1" valign="top">Precision</th>
                                <th align="left" colspan="2" rowspan="1" valign="top">Recall</th>
                                <th align="left" colspan="2" rowspan="1" valign="top">f
                                    <sub>
                                        <bold>1</bold>
                                    </sub> score</th>
                            </tr>
                            <tr>
                                <th align="left" colspan="1" rowspan="1" valign="top">Mean</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">sd</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">Mean</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">sd</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">Mean</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">sd</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">Mean</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">sd</th>
                            </tr>
                        </thead>
                        <tbody>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">DBSCAN-SWA</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.805</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.293</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.244</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.303</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.558</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.452</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.287</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.332</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Phage Finder</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.962</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.0407</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.674</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.386</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.343</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.328</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.404</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.320</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">PhageBoost</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.942</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.0423</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.399</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.277</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.667</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.388</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.434</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.265</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Phigaro</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.980</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.0232</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.748</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.337</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.566</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.323</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.611</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.320</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">PhiSpy</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.984</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.0246</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.772</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.330</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.731</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.309</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.733</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.306</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">ProphET</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.976</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.0258</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.646</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.385</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.517</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.357</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.542</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.350</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Seeker</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.582</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.273</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.0584</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.0746</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.477</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.406</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.093</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.101</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">VIBRANT</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.983</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.0246</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.675</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.356</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.702</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.377</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.677</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.355</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">VirSorter</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.955</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.0365</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.451</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.288</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.762</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.373</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.532</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.299</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">VirSorter2</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.939</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.0623</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.399</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.219</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.766</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.372</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.508</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.257</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
                <p>Each tool balances between recall and precision. For example, the more conservative Phage Finder performed relatively well in terms of precision, making very confident predictions, but had one of the lower mean recall ratios and was not predicting prophages based on limited information. In contrast, the more speculative DBSCAN-SWA and PhageBoost both exhibited the opposite trend.</p>
                <p>The f
                    <sub>1</sub> Score is a more nuanced metric, as it requires high performance in both precision and recall. PhiSpy, VIBRANT, Phigaro, ProphET, VirSorter, and VirSorter2 all averaged above 0.5, while the remaining tools suffered from many false predictions (FP or FN) (
                    <xref ref-type="fig" rid="f1">Figure 1d</xref>; 
                    <xref ref-type="table" rid="T3">Table 2</xref>).</p>
                <p>Lastly, we visualised f
                    <sub>1</sub> scores for each genus across the tools to elucidate selection biases in the database (Figure S2a). 
                    <italic toggle="yes">Escherichia</italic> appeared to perform either very well or very poorly depending on the tool used but most genera appeared to be less variable between the different tools. We performed Mann-Whitney tests to compare the f
                    <sub>1</sub> scores of each genus against the other genera (Figure S2b). The f
                    <sub>1</sub> scores for 
                    <italic toggle="yes">Streptococcus</italic>, 
                    <italic toggle="yes">Staphylococcus</italic>, 
                    <italic toggle="yes">Listeria</italic>, and 
                    <italic toggle="yes">Burkholderia</italic> were significantly higher than the population average, and the f
                    <sub>1</sub> scores for, 
                    <italic toggle="yes">Ralstonia</italic>, 
                    <italic toggle="yes">Photorhabdus</italic>, Mycobacterium, 
                    <italic toggle="yes">Geobacter</italic>, 
                    <italic toggle="yes">Deinococcus</italic>, 
                    <italic toggle="yes">Cyanobacterium, Brucella</italic>, and 
                    <italic toggle="yes">Bifidobacterium</italic> were significantly lower than the average. An explanation for some of this variation would be that 
                    <italic toggle="yes">Streptococcus</italic> prophages for instance are well studied and highly conserved (
                    <xref ref-type="bibr" rid="ref41">Rezaei Javan et al., 2019</xref>), whilst other genera have been studied less, or their (pro) phages are highly diverse.</p>
            </sec>
            <sec id="sec10">
                <title>Runtime performance</title>
                <p>Many users will not be too concerned about runtime performance, for instance if they are performing a one-off analysis on a genome of interest all the tools will finish in a reasonable time. However, efficient resource utilization is an important consideration for large-scale analyses. Provisioning computing resources costs money and a well optimised tool that runs fast translates to real-world savings. The runtime distributions across the genomes are shown for each tool in 
                    <xref ref-type="fig" rid="f2">Figure 2a</xref> and 
                    <xref ref-type="table" rid="T4">Table 3</xref>. The slowest prophage predictors were generally VirSorter and VirSorter2 with mean runtimes of 1,255 and 1,900 seconds respectively, except for a single DBSCAN-SWA run taking 5,718 seconds. Seeker was the fastest tool (6.65 seconds mean runtime), although this may not be a fair comparison given that multiple instances of this tool were not able to be run at the same time (see below). PhageBoost was the next fastest (37.8 seconds mean runtime) and Phage Finder, Phigaro, PhiSpy, and ProphET all performed similarly well in terms of runtime.</p>
                <fig fig-type="figure" id="f2" orientation="portrait" position="float">
                    <label>Figure 2. </label>
                    <caption>
                        <title>Runtime and peak memory usage comparison.</title>
                        <p>Violin plots for each tool are shown with individual points for each genome indicated. The graphs show total runtime in seconds (
                            <italic toggle="yes">a</italic>), peak memory usage in MB (
                            <italic toggle="yes">b</italic>), total file writes in MB (
                            <italic toggle="yes">c</italic>) and the final total disk usage (all genomes) in MB (
                            <italic toggle="yes">d</italic>). For all graphs, less is better.</p>
                    </caption>
                    <graphic id="gr2" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/124379/ca54a636-ce96-434b-a31b-eaefc246350d_figure2.gif"/>
                </fig>
                <table-wrap id="T4" orientation="portrait" position="float">
                    <label>Table 3. </label>
                    <caption>
                        <title>Summary runtime performance metrics for each tool</title>
                    </caption>
                    <table content-type="article-table" frame="hsides">
                        <thead>
                            <tr>
                                <th align="left" colspan="1" rowspan="2" valign="bottom">Tool</th>
                                <th align="left" colspan="2" rowspan="1" valign="top">Runtime (s)</th>
                                <th align="left" colspan="2" rowspan="1" valign="top">Peak RAM (GB)</th>
                                <th align="left" colspan="2" rowspan="1" valign="top">Disk writes (MB)</th>
                                <th align="left" colspan="1" rowspan="2" valign="bottom">Final disk usage (MB)</th>
                            </tr>
                            <tr>
                                <th align="left" colspan="1" rowspan="1" valign="top">Mean</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">sd</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">Mean</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">sd</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">Mean</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">sd</th>
                            </tr>
                        </thead>
                        <tbody>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">DBSCAN-SWA</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">848</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">653</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">8.76</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">11.0</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">222</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">342</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">4664</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Phage Finder</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">180</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">71.6</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.932</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">1.07</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">5.39</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">5.21</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">699</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">PhageBoost</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">39.8</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">26.4</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">1.99</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">2.09</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.000769</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.00268</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.149</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Phigaro</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">151</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">48</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.572</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.0684</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">6.15</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">2.45</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">305</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">PhiSpy</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">147</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">4.56</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.596</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.0302</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.427</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">2.02</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">20.8</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">ProphET</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">336</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">140</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.690</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.0105</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">38.3</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">17.1</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">1707</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Seeker</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">6.65</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">1.45</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">75.2</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">7.63</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.019</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.00305</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">305</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">VIBRANT</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">798</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">369</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.719</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.381</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">82.4</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">20.1</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">1567</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">VirSorter</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">1255</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">500</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.287</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.229</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">2065</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">16.5</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">12482</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">VirSorter2</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">1900</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">749</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.621</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">0.915</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">31.4</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">15.2</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">2469</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
                <p>Memory requirements also remain an important consideration for provisioning resources for large-scale analyses. For instance, inefficiency is encountered where the memory required by single-threaded processes exceeds the available memory per CPU. Peak memory usage for each tool is shown in 
                    <xref ref-type="fig" rid="f2">Figure 2b</xref> and 
                    <xref ref-type="table" rid="T4">Table 3</xref>. Seeker had by far the highest mean peak memory usage at 75.2 GB. Our approach of running an instance of a tool on each system CPU failed for Seeker due to its extremely high peak RAM usage. We instead ran Seeker on a single CPU, one genome at a time. DBSCAN-SWA had the next highest mean peak memory of 8.76 GB. However, several runs required nearly 35 GB peak memory. Memory requirements were lowest for VirSorter with 287 MB mean peak memory, and mean peak memory usage for Phage Finder, Phigaro, PhiSpy, ProphET, VIBRANT, and Virsorter2 were all under 1 GB. Apart from Seeker and the DBSCAN-SWA outliers, there were no situations where the peak memory usage would prevent the analysis from completing on a modest personal computer. At larger-scales, Phage Finder, Phigaro, PhiSpy, ProphET, VIBRANT, VirSorter, and VirSorter2 have an advantage in terms of peak memory usage.</p>
                <p>Another important consideration for large-scale analyses are the file sizes that are generated by the different tools. Large output file sizes can place considerable strain on storage capacities, and large numbers of read and write operations can severely impact the performance of a system or HPC cluster for all users. Total file writes for the default files (in MB, including temporary files) are shown in 
                    <xref ref-type="fig" rid="f2">Figure 2c</xref> and the final disk usage for all genomes for each tool is shown in 
                    <xref ref-type="fig" rid="f2">Figure 2d</xref>; these are also summarised in 
                    <xref ref-type="table" rid="T4">Table 3</xref>. VirSorter, DBSCAN-SWA, VIBRANT, ProphET, and VirSorter2 performed the most write operations. The other tools performed similarly well and have a clear advantage at scale as they perform far fewer disk writes. VirSorter and DBSCAN-SWA removed most of their generated files, however, the final disk usage for these tools were still the highest at 5.36 and 2.96 GB respectively. Disk usage for PhageBoost and PhiSpy was by far the lowest at 0.14 and 15 MB respectively.</p>
            </sec>
            <sec id="sec11">
                <title>Caveats</title>
                <p>Every bioinformatics comparison involves many biases. In this comparison, PhiSpy performs well, but we developed PhiSpy and many of the gold-standard genomes were extensively used during its development to optimize the algorithm. VirSorter and VirSorter2 were primarily developed to identify viral regions in metagenomes rather than prophages in bacterial genomes&#x2014;although they have been used for that e.g. in 
                    <xref ref-type="bibr" rid="ref14">Glickman et al. (2020)</xref>&#x2014;and filtering VirSorter and VirSorter2 hits with CheckV (
                    <xref ref-type="bibr" rid="ref26">Nayfach et al., 2021</xref>) is recommended. Likewise, Seeker was designed for classifying short sequences as either phage or non-phage. It was trained on phages, not prophages, and was not originally intended for classifying prophage regions in complete genomes. Furthermore, the current database of prophage annotations is heavily skewed towards more heavily studied phyla, and we show that there can be significant differences in performance depending on taxonomy. By openly providing the Prophage Prediction Comparison framework, creating a framework to install and test different software, and defining a straightforward approach to labelling prophages in GenBank files, we hope to expand our gold-standard set of genomes and mitigate many of our biases. We welcome the addition of other genomes (especially from beyond the Proteobacteria/Bacteroidetes/Firmicutes that are overrepresented in our gold-standard database).</p>
                <p>Recent developments in alternative approaches to predict prophages, including mining phage-like genes from metagenomes and then mapping them to complete genomes (
                    <xref ref-type="bibr" rid="ref26">Nayfach et al., 2021</xref>) and using short-read mapping to predict prophage regions from complete bacterial genomes (
                    <xref ref-type="bibr" rid="ref21">Kieft &amp; Anantharaman, 2021</xref>) have the potential to generate many more ground-truth prophage observations. However, both approaches are limited, as they identify prophages that are active, but not quiescent prophage regions. Thus, they will provide useful true positive datasets for prophage prediction algorithms but may not provide accurate true negative datasets.</p>
            </sec>
        </sec>
        <sec id="sec12" sec-type="conclusions">
            <title>Conclusions</title>
            <p>Establishing a gold-standard dataset of prophage and associated metrics is critical to enable a robust comparison of prophage prediction tools. In particular, the current comparison suggests that most tools perform reasonably well by themselves to detect phage-like regions in complete bacterial genomes, and most of the differences between tools stem from different trade-offs between precision and recall with default parameters and different compute resource requirements. Specifically, using the gold-standard dataset and the metrics defined here, PhiSpy, VIBRANT, and Phigaro were the best performing prophage prediction tools for f
                <sub>1</sub> score. Phage Finder performs well in terms of precision at the expense of false-negatives, whereas VirSorter, VirSorter2, DBSCAN-SWA and PhageBoost perform better for recall at the expense of false-positives. Currently, Seeker, DBSCAN-SWA, VirSorter, and to a lesser extent VirSorter2 are not as well suited for large-scale identification of prophages from complete bacterial genomes when compared to the other tools, and would require using custom cutoffs and/or post-processing predictions with another tool such as CheckV. In terms of runtime performance, PhiSpy and Phigaro were among the best in every metric, and ProphET and VIBRANT performed well in most metrics. These comparisons are, however, relying on expert curation of a limited number of genomes. More genomes with manually curated prophage annotations are thus needed as well as a larger number and diversity of experimentally-verified prophages, and we anticipate that these benchmarks will change with the addition of new genomes, the addition of new tools, and as the tools are updated over time. We intentionally designed the current framework to be easily amendable and expanded, and developers are strongly encouraged to contribute by adding or updating their tool and adding their manually curated and/or experimentally verified genomes to be included in the benchmarking. Users are strongly encouraged to check the GitHub repository for the latest results before making any decisions on which prophage prediction tool would best suit their needs.</p>
        </sec>
        <sec id="sec13">
            <title>Author contributions</title>
            <p>RAE conceived of the study; KM and PD generated the initial gold-standard set and MJR, SKG, LI, and EP contributed to the current gold-standard set; RAE and MJR created the framework; RAE, MJR, SR, MM, and JB performed the analysis. All authors contributed to the manuscript writing.</p>
        </sec>
        <sec id="sec4.1">
            <title>Funding information</title>
            <p>This work supported by the National Institute Of Diabetes And Digestive And Kidney Diseases of the National Institutes of Health under Award Number RC2DK116713 to RAE. The support provided by Flinders University for HPC research resources is acknowledged. The work conducted by the U.S. Department of Energy Joint Genome Institute (SR), a DOE Office of Science User Facility, is supported by the Office of Science of the U.S. Department of Energy under contract no. DE-AC02-05CH11231.</p>
        </sec>
        <sec id="sec14">
            <title>Data availability</title>
            <sec id="sec15">
                <title>Underlying data</title>
                <p>Zenodo: linsalrob/ProphagePredictionComparisons: Review release. 
                    <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.5281/zenodo.4739878">https://doi.org/10.5281/zenodo.4739878</ext-link>. (
                    <xref ref-type="bibr" rid="ref31">Roach &amp; Edwards, 2021b</xref>).</p>
                <p>This project contains the following underlying data;
                    <list list-type="bullet">
                        <list-item>
                            <label>&#x2022;</label>
                            <p>snakefiles/</p>
                            <list list-type="bullet">
                                <list-item>
                                    <p>&#x00ba;&#x2002;Snakemake pipeline files for running each of the prophage prediction tools against the gold-standard prophage-annotated genomes</p>
                                </list-item>
                            </list>
                        </list-item>
                        <list-item>
                            <label>&#x2022;</label>
                            <p>rules/</p>
                            <list list-type="bullet">
                                <list-item>
                                    <p>&#x00ba;&#x2002;Snakemake files with generic rules used by one or more of the Snakemake pipelines</p>
                                </list-item>
                            </list>
                        </list-item>
                        <list-item>
                            <label>&#x2022;</label>
                            <p>conda_environments/</p>
                            <list list-type="bullet">
                                <list-item>
                                    <p>&#x00ba;&#x2002;Configuration files for creating conda environments for use in the Snakemake pipelines</p>
                                </list-item>
                            </list>
                        </list-item>
                        <list-item>
                            <label>&#x2022;</label>
                            <p>data/</p>
                            <list list-type="bullet">
                                <list-item>
                                    <p>&#x00ba;&#x2002;Any custom small datasets required by the prophage prediction tools</p>
                                </list-item>
                            </list>
                        </list-item>
                        <list-item>
                            <label>&#x2022;</label>
                            <p>scripts/</p>
                            <list list-type="bullet">
                                <list-item>
                                    <p>&#x00ba;&#x2002;Perl and Python scripts that are used in the Snakemake pipelines for performing various tasks</p>
                                </list-item>
                            </list>
                        </list-item>
                        <list-item>
                            <label>&#x2022;</label>
                            <p>ProphagePredictionsLib/</p>
                            <list list-type="bullet">
                                <list-item>
                                    <p>&#x00ba;&#x2002;Library files required by the Perl and Python scripts</p>
                                </list-item>
                            </list>
                        </list-item>
                        <list-item>
                            <label>&#x2022;</label>
                            <p>jupyter_notebooks/</p>
                            <list list-type="bullet">
                                <list-item>
                                    <p>&#x00ba;&#x2002;Summary metric tables for all of the tools, and example Jupyter notebook for producing the comparison figures</p>
                                </list-item>
                            </list>
                        </list-item>
                        <list-item>
                            <label>&#x2022;</label>
                            <p>img/</p>
                            <list list-type="bullet">
                                <list-item>
                                    <p>&#x00ba;&#x2002;Example figures generated by the Jupyter notebook</p>
                                </list-item>
                            </list>
                        </list-item>
                        <list-item>
                            <label>&#x2022;</label>
                            <p>LICENCE</p>
                            <list list-type="bullet">
                                <list-item>
                                    <p>&#x00ba;&#x2002;Licence file for the github repository</p>
                                </list-item>
                            </list>
                        </list-item>
                        <list-item>
                            <label>&#x2022;</label>
                            <p>Supplementary/</p>
                            <list list-type="bullet">
                                <list-item>
                                    <p>&#x00ba;&#x2002;SupplementaryTables.xlsx</p>
                                    <list list-type="bullet">
                                        <list-item>
                                            <label>&#x25aa;</label>
                                            <p>(Sheet 1) Table S1. Genomes provided in the gold-standard library with manually curated prophages</p>
                                        </list-item>
                                    </list>
                                </list-item>
                                <list-item>
                                    <p>&#x00ba;&#x2002;FigureS1.png</p>
                                    <list list-type="bullet">
                                        <list-item>
                                            <label>&#x25aa;</label>
                                            <p>Figure S1. False positive comparison</p>
                                        </list-item>
                                    </list>
                                </list-item>
                                <list-item>
                                    <p>&#x00ba;&#x2002;FigureS2.png</p>
                                    <list list-type="bullet">
                                        <list-item>
                                            <label>&#x25aa;</label>
                                            <p>Figure S2a. F1 scores by genus for each tool</p>
                                        </list-item>
                                        <list-item>
                                            <label>&#x25aa;</label>
                                            <p>Figure S2b. F1 score distribution for each genus for all tools</p>
                                        </list-item>
                                    </list>
                                </list-item>
                                <list-item>
                                    <p>&#x00ba;&#x2002;prophageAnnotation.md</p>
                                    <list list-type="bullet">
                                        <list-item>
                                            <label>&#x25aa;</label>
                                            <p>The guidelines for manually curating prophage annotations</p>
                                        </list-item>
                                    </list>
                                </list-item>
                            </list>
                        </list-item>
                    </list>
                </p>
                <p>Underlying data and the prophage annotated GenBank files are also available at GitHub: Comparisons of multiple different prophage predictions 
                    <ext-link ext-link-type="uri" xlink:href="https://github.com/linsalrob/ProphagePredictionComparisons/tree/v0.1-beta">https://github.com/linsalrob/ProphagePredictionComparisons/tree/v0.1-beta</ext-link> (
                    <xref ref-type="bibr" rid="ref31">Roach &amp; Edwards, 2021a</xref>). Please note that you will need Git (
                    <ext-link ext-link-type="uri" xlink:href="http://git-scm.com">git-scm.com</ext-link>) and Git LFS (
                    <ext-link ext-link-type="uri" xlink:href="http://git-lfs.github.com">git-lfs.github.com</ext-link>) to retrieve the GenBank files from the GitHub repository. Support for these files and framework pipelines are available via GitHub 
                    <italic toggle="yes">issues.</italic>
                </p>
            </sec>
            <sec id="sec16">
                <title>Extended data</title>
                <p>Zenodo: Extended data for &#x2018;Philympics 2021: Prophage Predictions Perplex Programs&#x2019;: 
                    <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.5281/zenodo.4739878">https://doi.org/10.5281/zenodo.4739878</ext-link>.</p>
                <p>This project contains the following extended data:</p>
                <p>
                    <bold>SupplementaryTables.xlsx:</bold>
                </p>
                <p>
                    <list list-type="bullet">
                        <list-item>
                            <label>&#x2022;</label>
                            <p>
                                <bold>Table S1. Genomes provided in the gold-standard library with manually curated prophages</bold>
                            </p>
                        </list-item>
                    </list>
                </p>
                <p>
                    <bold>FigureS1.png:</bold>
                </p>
                <p>
                    <list list-type="bullet">
                        <list-item>
                            <label>&#x2022;</label>
                            <p>
                                <bold>Figure S1. False positive comparison.</bold> Violin plots for each tool show &#x2018;False Positives&#x2019; as the number of genes incorrectly labelled prophage genes in each genome. Less is better.</p>
                        </list-item>
                    </list>
                </p>
                <p>
                    <bold>FigureS2.png:</bold>
                </p>
                <p>
                    <list list-type="bullet">
                        <list-item>
                            <label>&#x2022;</label>
                            <p>
                                <bold>Figure S2a. F1 scores by genus for each tool.</bold> F1 scores are shown for each genome grouped and coloured by genus and separated by prophage caller.</p>
                        </list-item>
                        <list-item>
                            <label>&#x2022;</label>
                            <p>
                                <bold>Figure S2b. F1 score distribution for each genus for all tools. </bold> Boxplots of F1 scores for each genome over all tools, grouped and coloured by genus. P-values and significance are indicated for Mann-Whitney tests that were performed to determine if a genus had significantly higher or lower F1 scores when compared to the other genera.</p>
                        </list-item>
                    </list>
                </p>
                <p>
                    <bold>prophageAnnotation.md</bold>
                </p>
                <p>
                    <list list-type="bullet">
                        <list-item>
                            <label>&#x2022;</label>
                            <p>The guidelines for manually curating prophage annotations.</p>
                        </list-item>
                    </list>
                </p>
            </sec>
        </sec>
    </body>
    <back>
        <ref-list>
            <title>References</title>
            <ref id="ref39">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Abedon</surname>
                            <given-names>ST</given-names>
                        </name>
</person-group>:
                    <article-title>Bacteriophage secondary infection.</article-title>
                    <source>

                        <italic toggle="yes">Virologica Sinica.</italic>
</source>
                    <year>2015</year>;<volume>30</volume>:<fpage>3</fpage>&#x2013;<lpage>10</lpage>.
                    <pub-id pub-id-type="pmid">25595214</pub-id>
                    <pub-id pub-id-type="doi">10.1007/s12250-014-3547-2</pub-id>
                </mixed-citation>
            </ref>
            <ref id="re40">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Abedon</surname>
                            <given-names>ST</given-names>
                        </name>
</person-group>:
                    <article-title>Look Who&#x2019;s Talking: T-Even Phage Lysis Inhibition, the Granddaddy of Virus-Virus Intercellular Communication Research.</article-title>
                    <source>

                        <italic toggle="yes">Viruses.</italic>
</source>
                    <year>2019</year>;<volume>11</volume>:<fpage>951</fpage>.
                    <pub-id pub-id-type="pmid">31623057</pub-id>
                    <pub-id pub-id-type="doi">10.3390/v11100951</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref1">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Akhter</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Aziz</surname>
                            <given-names>RK</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Edwards</surname>
                            <given-names>RA</given-names>
                        </name>
</person-group>:
                    <article-title>PhiSpy: a novel algorithm for finding prophages in bacterial genomes that combines similarity- and composition-based strategies.</article-title>
                    <source>

                        <italic toggle="yes">Nucleic Acids Res.</italic>
</source>
                    <year>2012</year>;<volume>40</volume>:<fpage>e126</fpage>&#x2013;<lpage>e126</lpage>.
                    <pub-id pub-id-type="pmid">22584627</pub-id>
                    <pub-id pub-id-type="doi">10.1093/nar/gks406</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3439882</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref2">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Amgarten</surname>
                            <given-names>D</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Braga</surname>
                            <given-names>LPP</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Da Silva</surname>
                            <given-names>AM</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>MARVEL, a Tool for Prediction of Bacteriophage Sequences in Metagenomic Bins.</article-title>
                    <source>

                        <italic toggle="yes">Front Genet.</italic>
</source>
                    <year>2018</year>;<volume>9</volume>.
                    <pub-id pub-id-type="pmid">30131825</pub-id>
                    <pub-id pub-id-type="doi">10.3389/fgene.2018.00304</pub-id>
                    <pub-id pub-id-type="pmcid">PMC6090037</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref3">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Arndt</surname>
                            <given-names>D</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Grant</surname>
                            <given-names>JR</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Marcu</surname>
                            <given-names>A</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>PHASTER: a better, faster version of the PHAST phage search tool.</article-title>
                    <source>

                        <italic toggle="yes">Nucleic Acids Res.</italic>
</source>
                    <year>2016</year>;<volume>44</volume>:<fpage>W16</fpage>&#x2013;<lpage>W21</lpage>.
                    <pub-id pub-id-type="pmid">27141966</pub-id>
                    <pub-id pub-id-type="doi">10.1093/nar/gkw387</pub-id>
                    <pub-id pub-id-type="pmcid">PMC4987931</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref4">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Aziz</surname>
                            <given-names>RK</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Bartels</surname>
                            <given-names>D</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Best</surname>
                            <given-names>AA</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>The RAST Server: Rapid Annotations using Subsystems Technology.</article-title>
                    <source>

                        <italic toggle="yes">BMC Genomics.</italic>
</source>
                    <year>2008</year>;<volume>9</volume>:<fpage>75</fpage>.
                    <pub-id pub-id-type="pmid">18261238</pub-id>
                    <pub-id pub-id-type="doi">10.1186/1471-2164-9-75</pub-id>
                    <pub-id pub-id-type="pmcid">PMC2265698</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref5">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Breitbart</surname>
                            <given-names>M</given-names>
                        </name>
</person-group>:
                    <article-title>Marine Viruses: Truth or Dare.</article-title>
                    <source>

                        <italic toggle="yes">Ann Rev Mar Sci.</italic>
</source>
                    <year>2012</year>;<volume>4</volume>:<fpage>425</fpage>&#x2013;<lpage>448</lpage>.
                    <pub-id pub-id-type="pmid">22457982</pub-id>
                    <pub-id pub-id-type="doi">10.1146/annurev-marine-120709-142805</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref6">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Br&#x00fc;ssow</surname>
                            <given-names>H</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Canchaya</surname>
                            <given-names>C</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Hardt</surname>
                            <given-names>W-D</given-names>
                        </name>
</person-group>:
                    <article-title>Phages and the Evolution of Bacterial Pathogens: from Genomic Rearrangements to Lysogenic Conversion.</article-title>
                    <source>

                        <italic toggle="yes">Microbiol Mol Biol Rev.</italic>
</source>
                    <year>2004</year>;<volume>68</volume>:<fpage>560</fpage>&#x2013;<lpage>602</lpage>.
                    <pub-id pub-id-type="pmid">15353570</pub-id>
                    <pub-id pub-id-type="doi">10.1128/MMBR.68.3.560-602.2004</pub-id>
                    <pub-id pub-id-type="pmcid">PMC515249</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref8">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Campbell</surname>
                            <given-names>AM</given-names>
                        </name>
</person-group>:
                    <article-title>Preferential Orientation Preferential Orientation of Natural Lambdoid Prophages and Bacterial Chromosome Organization.</article-title>
                    <source>

                        <italic toggle="yes">Theor Popul Biol.</italic>
</source>
                    <year>2002</year>;<volume>61</volume>:<fpage>503</fpage>&#x2013;<lpage>507</lpage>.
                    <pub-id pub-id-type="pmid">12167370</pub-id>
                    <pub-id pub-id-type="doi">10.1006/tpbi.2002.1604</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref9">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Canchaya</surname>
                            <given-names>C</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Proux</surname>
                            <given-names>C</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Fournous</surname>
                            <given-names>G</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Prophage Genomics.</article-title>
                    <source>

                        <italic toggle="yes">Microbiol Mol Biol Rev.</italic>
</source>
                    <year>2003</year>;<volume>67</volume>:<fpage>238</fpage>&#x2013;<lpage>276</lpage>.
                    <pub-id pub-id-type="pmid">12794192</pub-id>
                    <pub-id pub-id-type="doi">10.1128/MMBR.67.2.238-276.2003</pub-id>
                    <pub-id pub-id-type="pmcid">PMC156470</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref10">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Casjens</surname>
                            <given-names>S</given-names>
                        </name>
</person-group>:
                    <article-title>Prophages and bacterial genomics: what have we learned so far?</article-title>
                    <source>

                        <italic toggle="yes">Mol Microbiol.</italic>
</source>
                    <year>2003</year>;<volume>49</volume>:<fpage>277</fpage>&#x2013;<lpage>300</lpage>.
                    <pub-id pub-id-type="pmid">12886937</pub-id>
                    <pub-id pub-id-type="doi">10.1046/j.1365-2958.2003.03580.x</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref11">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Dutilh</surname>
                            <given-names>BE</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Cassman</surname>
                            <given-names>N</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Mcnair</surname>
                            <given-names>K</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>A highly abundant bacteriophage discovered in the unknown sequences of human faecal metagenomes.</article-title>
                    <source>

                        <italic toggle="yes">Nat Commun.</italic>
</source>
                    <year>2014</year>;<volume>5</volume>:<fpage>4498</fpage>.
                    <pub-id pub-id-type="pmid">25058116</pub-id>
                    <pub-id pub-id-type="doi">10.1038/ncomms5498</pub-id>
                    <pub-id pub-id-type="pmcid">PMC4111155</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref12">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Fouts</surname>
                            <given-names>DE</given-names>
                        </name>
</person-group>:
                    <article-title>Phage_Finder: Automated identification and classification of prophage regions in complete bacterial genome sequences.</article-title>
                    <source>

                        <italic toggle="yes">Nucleic Acids Res.</italic>
</source>
                    <year>2006</year>;<volume>34</volume>:<fpage>5839</fpage>&#x2013;<lpage>5851</lpage>.
                    <pub-id pub-id-type="pmid">17062630</pub-id>
                    <pub-id pub-id-type="doi">10.1093/nar/gkl732</pub-id>
                    <pub-id pub-id-type="pmcid">PMC1635311</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref13">
                <mixed-citation publication-type="other">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Gan</surname>
                            <given-names>R</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Zhou</surname>
                            <given-names>F</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Si</surname>
                            <given-names>Y</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>DBSCAN-SWA: an integrated tool for rapid prophage detection and annotation.</article-title>
                    <source>

                        <italic toggle="yes">bioRxiv.</italic>
</source>
                    <year>2020</year>;<fpage>2020.07.12.199018</fpage>.
                    <pub-id pub-id-type="doi">10.1101/2020.07.12.199018</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref14">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Glickman</surname>
                            <given-names>C</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Kammlade</surname>
                            <given-names>SM</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Hasan</surname>
                            <given-names>NA</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Characterization of integrated prophages within diverse species of clinical nontuberculous mycobacteria.</article-title>
                    <source>

                        <italic toggle="yes">Virol J.</italic>
</source>
                    <year>2020</year>;<volume>17</volume>:<fpage>124</fpage>.
                    <pub-id pub-id-type="pmid">32807206</pub-id>
                    <pub-id pub-id-type="doi">10.1186/s12985-020-01394-y</pub-id>
                    <pub-id pub-id-type="pmcid">PMC7433156</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref15">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Grazziotin</surname>
                            <given-names>AL</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Koonin</surname>
                            <given-names>EV</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Kristensen</surname>
                            <given-names>DM</given-names>
                        </name>
</person-group>:
                    <article-title>Prokaryotic Virus Orthologous Groups (pVOGs): a resource for comparative genomics and protein family annotation.</article-title>
                    <source>

                        <italic toggle="yes">Nucleic acids res.</italic>
</source>
                    <year>2017</year>;<volume>45</volume>:<fpage>D491</fpage>&#x2013;<lpage>D498</lpage>.
                    <pub-id pub-id-type="pmid">27789703</pub-id>
                    <pub-id pub-id-type="doi">10.1093/nar/gkw975</pub-id>
                    <pub-id pub-id-type="pmcid">PMC5210652</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref16">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Grigoriev</surname>
                            <given-names>A</given-names>
                        </name>
</person-group>:
                    <article-title>Analyzing genomes with cumulative skew diagrams.</article-title>
                    <source>

                        <italic toggle="yes">Nucleic Acids Res.</italic>
</source>
                    <year>1998</year>;<volume>26</volume>:<fpage>2286</fpage>&#x2013;<lpage>2290</lpage>.
                    <pub-id pub-id-type="pmid">9580676</pub-id>
                    <pub-id pub-id-type="doi">10.1093/nar/26.10.2286</pub-id>
                    <pub-id pub-id-type="pmcid">PMC147580</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref17">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Gr&#x00fc;ning</surname>
                            <given-names>B</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Dale</surname>
                            <given-names>R</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Sj&#x00f6;din</surname>
                            <given-names>A</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Bioconda: sustainable and comprehensive software distribution for the life sciences.</article-title>
                    <source>

                        <italic toggle="yes">Nat Methods.</italic>
</source>
                    <year>2018</year>;<volume>15</volume>:<fpage>475</fpage>&#x2013;<lpage>476</lpage>.
                    <pub-id pub-id-type="pmid">29967506</pub-id>
                    <pub-id pub-id-type="doi">10.1038/s41592-018-0046-7</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref18">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Guo</surname>
                            <given-names>J</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Bolduc</surname>
                            <given-names>B</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Zayed</surname>
                            <given-names>AA</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>VirSorter2: a multi-classifier, expert-guided approach to detect diverse DNA and RNA viruses.</article-title>
                    <source>

                        <italic toggle="yes">Microbiome.</italic>
</source>
                    <year>2021</year>;<volume>9</volume>:<fpage>37</fpage>.
                    <pub-id pub-id-type="pmid">33522966</pub-id>
                    <pub-id pub-id-type="doi">10.1186/s40168-020-00990-y</pub-id>
                    <pub-id pub-id-type="pmcid">PMC7852108</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref19">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Hyatt</surname>
                            <given-names>D</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Chen</surname>
                            <given-names>G-L</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Locascio</surname>
                            <given-names>PF</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Prodigal: prokaryotic gene recognition and translation initiation site identification.</article-title>
                    <source>

                        <italic toggle="yes">BMC bioinformatics.</italic>
</source>
                    <year>2010</year>;<volume>11</volume>:<fpage>119</fpage>&#x2013;<lpage>119</lpage>.
                    <pub-id pub-id-type="pmid">20211023</pub-id>
                    <pub-id pub-id-type="doi">10.1186/1471-2105-11-119</pub-id>
                    <pub-id pub-id-type="pmcid">PMC2848648</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref20">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Kang</surname>
                            <given-names>HS</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Mcnair</surname>
                            <given-names>K</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Cuevas</surname>
                            <given-names>DA</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Prophage genomics reveals patterns in phage genome organization and replication.</article-title>
                    <source>

                        <italic toggle="yes">bioRxiv.</italic>
</source>
                    <year>2017</year>:<fpage>114819</fpage>.
                    <pub-id pub-id-type="doi">10.1101/114819</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref21">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Kieft</surname>
                            <given-names>K</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Anantharaman</surname>
                            <given-names>K</given-names>
                        </name>
</person-group>:
                    <article-title>Deciphering active prophages from metagenomes.</article-title>
                    <source>

                        <italic toggle="yes">bioRxiv.</italic>
</source>
                    <year>2021</year>:<fpage>2021.01.29.428894</fpage>.
                    <pub-id pub-id-type="doi">10.1101/2021.01.29.428894</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref22">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Kieft</surname>
                            <given-names>K</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Zhou</surname>
                            <given-names>Z</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Anantharaman</surname>
                            <given-names>K</given-names>
                        </name>
</person-group>:
                    <article-title>VIBRANT: automated recovery, annotation and curation of microbial viruses, and evaluation of viral community function from genomic sequences.</article-title>
                    <source>

                        <italic toggle="yes">Microbiome.</italic>
</source>
                    <year>2020</year>;<volume>8</volume>:<fpage>90</fpage>.
                    <pub-id pub-id-type="pmid">32522236</pub-id>
                    <pub-id pub-id-type="doi">10.1186/s40168-020-00867-0</pub-id>
                    <pub-id pub-id-type="pmcid">PMC7288430</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref23">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>K&#x00f6;ster</surname>
                            <given-names>J</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Rahmann</surname>
                            <given-names>S</given-names>
                        </name>
</person-group>:
                    <article-title>Snakemake&#x2014;a scalable bioinformatics workflow engine.</article-title>
                    <source>

                        <italic toggle="yes">Bioinformatics.</italic>
</source>
                    <year>2012</year>;<volume>28</volume>:<fpage>2520</fpage>&#x2013;<lpage>2522</lpage>.
                    <pub-id pub-id-type="pmid">29788404</pub-id>
                    <pub-id pub-id-type="doi">10.1093/bioinformatics/bty350</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref24">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Lima-Mendez</surname>
                            <given-names>G</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Van Helden</surname>
                            <given-names>J</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Toussaint</surname>
                            <given-names>A</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Prophinder: a computational tool for prophage prediction in prokaryotic genomes.</article-title>
                    <source>

                        <italic toggle="yes">Bioinformatics.</italic>
</source>
                    <year>2008</year>;<volume>24</volume>:<fpage>863</fpage>&#x2013;<lpage>865</lpage>.
                    <pub-id pub-id-type="pmid">18238785</pub-id>
                    <pub-id pub-id-type="doi">10.1093/bioinformatics/btn043</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref25">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Mcnair</surname>
                            <given-names>K</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Zhou</surname>
                            <given-names>C</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Dinsdale</surname>
                            <given-names>EA</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>PHANOTATE: a novel approach to gene identification in phage genomes.</article-title>
                    <source>

                        <italic toggle="yes">Bioinformatics.</italic>
</source>
                    <year>2019</year>;<volume>35</volume>:<fpage>4537</fpage>&#x2013;<lpage>4542</lpage>.
                    <pub-id pub-id-type="pmid">31329826</pub-id>
                    <pub-id pub-id-type="doi">10.1093/bioinformatics/btz265</pub-id>
                    <pub-id pub-id-type="pmcid">PMC6853651</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref26">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Nayfach</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Camargo</surname>
                            <given-names>AP</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Schulz</surname>
                            <given-names>F</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>CheckV assesses the quality and completeness of metagenome-assembled viral genomes.</article-title>
                    <source>

                        <italic toggle="yes">Nat Biotechnol.</italic>
</source>
                    <year>2021</year>;<volume>39</volume>:<fpage>578</fpage>&#x2013;<lpage>585</lpage>.
                    <pub-id pub-id-type="pmid">33349699</pub-id>
                    <pub-id pub-id-type="doi">10.1038/s41587-020-00774-7</pub-id>
                    <pub-id pub-id-type="pmcid">PMC8116208</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref27">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Niu</surname>
                            <given-names>Q</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Peng</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Zhang</surname>
                            <given-names>X</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>LysoPhD: predicting functional prophages in bacterial genomes from high-throughput sequencing.</article-title>
                    <source>

                        <italic toggle="yes">2019 IEEE International Conference on Bioinformatics and Biomedicine (BIBM), 18-21 Nov. 2019.</italic>
</source>
                    <year>2019</year>;<fpage>1</fpage>&#x2013;<lpage>5</lpage>.
                    <pub-id pub-id-type="doi">10.1109/BIBM47256.2019.8983280</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref28">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Noguchi</surname>
                            <given-names>H</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Taniguchi</surname>
                            <given-names>T</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Itoh</surname>
                            <given-names>T</given-names>
                        </name>
</person-group>:
                    <article-title>MetaGeneAnnotator: detecting species-specific patterns of ribosomal binding site for precise gene prediction in anonymous prokaryotic and phage genomes.</article-title>
                    <source>

                        <italic toggle="yes">DNA res.</italic>
</source>
                    <year>2008</year>;<volume>15</volume>:<fpage>387</fpage>&#x2013;<lpage>396</lpage>.
                    <pub-id pub-id-type="pmid">18940874</pub-id>
                    <pub-id pub-id-type="doi">10.1093/dnares/dsn027</pub-id>
                    <pub-id pub-id-type="pmcid">PMC2608843</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref29">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Reis-Cunha</surname>
                            <given-names>JL</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Bartholomeu</surname>
                            <given-names>DC</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Manson</surname>
                            <given-names>AL</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>ProphET, prophage estimation tool: A stand-alone prophage sequence prediction tool with self-updating reference database.</article-title>
                    <source>

                        <italic toggle="yes">PLOS ONE.</italic>
</source>
                    <year>2019</year>;<volume>14</volume>:<fpage>e0223364</fpage>.
                    <pub-id pub-id-type="pmid">31577829</pub-id>
                    <pub-id pub-id-type="doi">10.1371/journal.pone.0223364</pub-id>
                    <pub-id pub-id-type="pmcid">PMC6774505</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref41">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Rezaei Javan</surname>
                            <given-names>R</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Ramos-Sevillano</surname>
                            <given-names>E</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Akter</surname>
                            <given-names>A</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Prophages and satellite prophages are widespread in Streptococcus and may play a role in pneumococcal pathogenesis.</article-title>
                    <source>

                        <italic toggle="yes">Nat Commun.</italic>
</source>
                    <year>2019</year>;<volume>10</volume>:<fpage>4852</fpage>.</mixed-citation>
            </ref>
            <ref id="ref30">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Roach</surname>
                            <given-names>MJ</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Edwards</surname>
                            <given-names>RA</given-names>
                        </name>
</person-group>:
                    <article-title>linsalrob/ProphagePredictionComparisons [Online].</article-title>
                    <source>

                        <italic toggle="yes">GitHub</italic>
</source>.<year>2021a</year>. [Accessed].
                    <ext-link ext-link-type="uri" xlink:href="https://github.com/linsalrob/ProphagePredictionComparisons/">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref31">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Roach</surname>
                            <given-names>MJ</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Edwards</surname>
                            <given-names>RA</given-names>
                        </name>
</person-group>:
                    <article-title>linsalrob/ProphagePredictionComparisons: Review release (Version v0.1).</article-title>
                    <source>

                        <italic toggle="yes">Zenodo.</italic>
</source>
                    <year>2021b</year>.</mixed-citation>
            </ref>
            <ref id="ref32">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Roux</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Enault</surname>
                            <given-names>F</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Hurwitz</surname>
                            <given-names>BL</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>VirSorter: mining viral signal from microbial genomic data.</article-title>
                    <source>

                        <italic toggle="yes">PeerJ.</italic>
</source>
                    <year>2015</year>;<volume>3</volume>:<fpage>e985</fpage>.
                    <pub-id pub-id-type="pmid">26038737</pub-id>
                    <pub-id pub-id-type="doi">10.7717/peerj.985</pub-id>
                    <pub-id pub-id-type="pmcid">PMC4451026</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref33">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Seemann</surname>
                            <given-names>T</given-names>
                        </name>
</person-group>:
                    <article-title>Prokka: rapid prokaryotic genome annotation.</article-title>
                    <source>

                        <italic toggle="yes">Bioinformatics.</italic>
</source>
                    <year>2014</year>;<volume>30</volume>:<fpage>2068</fpage>&#x2013;<lpage>2069</lpage>.
                    <pub-id pub-id-type="pmid">24642063</pub-id>
                    <pub-id pub-id-type="doi">10.1093/bioinformatics/btu153</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref34">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Sir&#x00e9;n</surname>
                            <given-names>K</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Millard</surname>
                            <given-names>A</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Petersen</surname>
                            <given-names>B</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Rapid discovery of novel prophages using biological feature engineering and machine learning.</article-title>
                    <source>

                        <italic toggle="yes">NAR Genom Bioinform.</italic>
</source>
                    <year>2021</year>;<fpage>3</fpage>.
                    <pub-id pub-id-type="doi">10.1093/nargab/lqaa109</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref35">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Song</surname>
                            <given-names>W</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Sun</surname>
                            <given-names>H-X</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Zhang</surname>
                            <given-names>C</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Prophage Hunter: an integrative hunting tool for active prophages.</article-title>
                    <source>

                        <italic toggle="yes">Nucleic Acids Res.</italic>
</source>
                    <year>2019</year>;<volume>47</volume>:<fpage>W74</fpage>&#x2013;<lpage>W80</lpage>.
                    <pub-id pub-id-type="pmid">31114893</pub-id>
                    <pub-id pub-id-type="doi">10.1093/nar/gkz380</pub-id>
                    <pub-id pub-id-type="pmcid">PMC6602508</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref36">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Sousa</surname>
                            <given-names>ALD</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Mau&#x00e9;s</surname>
                            <given-names>D</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Lobato</surname>
                            <given-names>A</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>PhageWeb &#x2013; Web Interface for Rapid Identification and Characterization of Prophages in Bacterial Genomes.</article-title>
                    <source>

                        <italic toggle="yes">Fron Genet.</italic>
</source>
                    <year>2018</year>;<volume>9</volume>.
                    <pub-id pub-id-type="pmid">30619469</pub-id>
                    <pub-id pub-id-type="doi">10.3389/fgene.2018.00644</pub-id>
                    <pub-id pub-id-type="pmcid">PMC6305541</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref37">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Starikova</surname>
                            <given-names>EV</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Tikhonova</surname>
                            <given-names>PO</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Prianichnikov</surname>
                            <given-names>NA</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Phigaro: high-throughput prophage sequence annotation.</article-title>
                    <source>

                        <italic toggle="yes">Bioinformatics.</italic>
</source>
                    <year>2020</year>;<volume>36</volume>:<fpage>3882</fpage>&#x2013;<lpage>3884</lpage>.
                    <pub-id pub-id-type="pmid">32311023</pub-id>
                    <pub-id pub-id-type="doi">10.1093/bioinformatics/btaa250</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref38">
                <mixed-citation publication-type="other">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Terzian</surname>
                            <given-names>P</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Olo Ndela</surname>
                            <given-names>E</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Galiez</surname>
                            <given-names>C</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>PHROG: families of prokaryotic virus proteins clustered using remote homology. [Online].</article-title>
                    <year>2021</year>. [Accessed June 2021].
                    <ext-link ext-link-type="uri" xlink:href="https://phrogs.lmge.uca.fr/">Reference Source</ext-link>
                </mixed-citation>
            </ref>
        </ref-list>
    </back>
    <sub-article article-type="reviewer-report" id="report130220">
        <front-stub>
            <article-id pub-id-type="doi">10.5256/f1000research.124379.r130220</article-id>
            <title-group>
                <article-title>Reviewer response for version 2</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author">
                    <name>
                        <surname>Anantharaman</surname>
                        <given-names>Karthik</given-names>
                    </name>
                    <xref ref-type="aff" rid="r130220a1">1</xref>
                    <role>Referee</role>
                    <uri content-type="orcid">https://orcid.org/0000-0002-9584-2491</uri>
                </contrib>
                <contrib contrib-type="author">
                    <name>
                        <surname>Kieft</surname>
                        <given-names>Kristopher</given-names>
                    </name>
                    <xref ref-type="aff" rid="r130220a1">1</xref>
                    <role>Co-referee</role>
                </contrib>
                <aff id="r130220a1">
                    <label>1</label>Department of Bacteriology, University of Wisconsin-Madison, Madison, WI, USA</aff>
            </contrib-group>
            <author-notes>
                <fn fn-type="conflict">
                    <p>
                        <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>23</day>
                <month>5</month>
                <year>2022</year>
            </pub-date>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2022 Anantharaman K and Kieft K</copyright-statement>
                <copyright-year>2022</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access peer review report distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <related-article ext-link-type="doi" id="relatedArticleReport130220" related-article-type="peer-reviewed-article" xlink:href="10.12688/f1000research.54449.2"/>
            <custom-meta-group>
                <custom-meta>
                    <meta-name>recommendation</meta-name>
                    <meta-value>approve-with-reservations</meta-value>
                </custom-meta>
            </custom-meta-group>
        </front-stub>
        <body>
            <p>Our only remaining concern is still with the manual validation and curation of the gold standard dataset (i.e., Methods). We appreciate that efforts have been made to provide a GitHub repo that outlines the methods completed by the authors, but it is still lacking in detail. The guidelines provided are highly generalized guidelines and read as notes rather than methods. What we look for in methods are an ability to replicate the results or at least details of how the study was performed. Focusing on the GitHub repo, there is an abundance of ambiguous information that makes the curation of a gold standard dataset, and the cutoffs used by the authors in this publication, impossible to follow. Please provide more details of the actual methods used.</p>
            <p> </p>
            <p> Here are some examples, though they are not limited to these: 
                <list list-type="bullet">
                    <list-item>
                        <p>&#x201c;Start by identifying proteins with sequence homology to known viral (phage) proteins&#x201d;. What ORF prediction tool was used? What annotation tool and database was used? What cutoffs were used?</p>
                    </list-item>
                    <list-item>
                        <p>&#x201c;Tracks of hypothetical proteins&#x201d; How long is a &#x2018;track&#x2019;? 10 proteins, 20 proteins? a specific number or example would be ideal here. The number of hypothetical annotations is also entirely dependent on the database or number of databases used to annotate.</p>
                    </list-item>
                    <list-item>
                        <p>&#x201c;Local changes in GC% content over the potential prophage region&#x201d; What constitutes a change? 2%, 5%, 10% GC change? Over what size of windows?</p>
                    </list-item>
                    <list-item>
                        <p>Once a candidate region is observed manual inspection includes searching for the presence of 'the most conserved proteins' a prophage should have or we expect to find&#x201d; Is there any guidelines on this?</p>
                    </list-item>
                    <list-item>
                        <p>&#x201c;Presence of direct repeats surrounding potential prophage region (indicating potential attachment sites)&#x201d;. Is there any particular upper and lower bound lengths for the repeats?</p>
                    </list-item>
                    <list-item>
                        <p>&#x201c;an additional search with the HHpred is performed&#x201d;. Methods require specific commands used and/or workflows, plus tool versions. Some specific examples would be good to provide.</p>
                    </list-item>
                    <list-item>
                        <p>&#x201c;Try to find nearly identical prophage region in a different bacterial genome". What is considered as nearly identical? &gt;80%, &gt;90% nucleotide identity?</p>
                    </list-item>
                    <list-item>
                        <p>&#x201c;Take just the parts surrounding the candidate prophage region, join them into a single continuous sequence and search NT database&#x201d;. What does &#x2018;just the parts&#x2019; mean? Is this a nucleotide region? How long of a region?</p>
                    </list-item>
                </list>
            </p>
            <p>Is the work clearly and accurately presented and does it cite the current literature?</p>
            <p>Yes</p>
            <p>If applicable, is the statistical analysis and its interpretation appropriate?</p>
            <p>Yes</p>
            <p>Are all the source data underlying the results available to ensure full reproducibility?</p>
            <p>Yes</p>
            <p>Is the study design appropriate and is the work technically sound?</p>
            <p>Partly</p>
            <p>Are the conclusions drawn adequately supported by the results?</p>
            <p>Yes</p>
            <p>Are sufficient details of methods and analysis provided to allow replication by others?</p>
            <p>Partly</p>
            <p>Reviewer Expertise:</p>
            <p>Metagenomics, Microbial and Phage ecology</p>
            <p>We confirm that we have read this submission and believe that we have an appropriate level of expertise to confirm that it is of an acceptable scientific standard, however we have significant reservations, as outlined above.</p>
        </body>
    </sub-article>
    <sub-article article-type="reviewer-report" id="report130221">
        <front-stub>
            <article-id pub-id-type="doi">10.5256/f1000research.124379.r130221</article-id>
            <title-group>
                <article-title>Reviewer response for version 2</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author">
                    <name>
                        <surname>Nobrega</surname>
                        <given-names>Franklin</given-names>
                    </name>
                    <xref ref-type="aff" rid="r130221a1">1</xref>
                    <role>Referee</role>
                    <uri content-type="orcid">https://orcid.org/0000-0002-8238-1083</uri>
                </contrib>
                <aff id="r130221a1">
                    <label>1</label>School of Biological Sciences, Faculty of Environmental and Life Sciences, University of Southampton, Southampton, UK</aff>
            </contrib-group>
            <author-notes>
                <fn fn-type="conflict">
                    <p>
                        <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>25</day>
                <month>4</month>
                <year>2022</year>
            </pub-date>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2022 Nobrega F</copyright-statement>
                <copyright-year>2022</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access peer review report distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <related-article ext-link-type="doi" id="relatedArticleReport130221" related-article-type="peer-reviewed-article" xlink:href="10.12688/f1000research.54449.2"/>
            <custom-meta-group>
                <custom-meta>
                    <meta-name>recommendation</meta-name>
                    <meta-value>approve</meta-value>
                </custom-meta>
            </custom-meta-group>
        </front-stub>
        <body>
            <p>I have no further comments to make.</p>
            <p>Is the work clearly and accurately presented and does it cite the current literature?</p>
            <p>Yes</p>
            <p>If applicable, is the statistical analysis and its interpretation appropriate?</p>
            <p>No</p>
            <p>Are all the source data underlying the results available to ensure full reproducibility?</p>
            <p>Yes</p>
            <p>Is the study design appropriate and is the work technically sound?</p>
            <p>Yes</p>
            <p>Are the conclusions drawn adequately supported by the results?</p>
            <p>Yes</p>
            <p>Are sufficient details of methods and analysis provided to allow replication by others?</p>
            <p>Yes</p>
            <p>Reviewer Expertise:</p>
            <p>Phage biology, phage-host interactions</p>
            <p>I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard.</p>
        </body>
    </sub-article>
    <sub-article article-type="reviewer-report" id="report91781">
        <front-stub>
            <article-id pub-id-type="doi">10.5256/f1000research.57937.r91781</article-id>
            <title-group>
                <article-title>Reviewer response for version 1</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author">
                    <name>
                        <surname>Anantharaman</surname>
                        <given-names>Karthik</given-names>
                    </name>
                    <xref ref-type="aff" rid="r91781a1">1</xref>
                    <role>Referee</role>
                    <uri content-type="orcid">https://orcid.org/0000-0002-9584-2491</uri>
                </contrib>
                <contrib contrib-type="author">
                    <name>
                        <surname>Kieft</surname>
                        <given-names>Kristopher</given-names>
                    </name>
                    <xref ref-type="aff" rid="r91781a1">1</xref>
                    <role>Co-referee</role>
                </contrib>
                <aff id="r91781a1">
                    <label>1</label>Department of Bacteriology, University of Wisconsin-Madison, Madison, WI, USA</aff>
            </contrib-group>
            <author-notes>
                <fn fn-type="conflict">
                    <p>
                        <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>31</day>
                <month>8</month>
                <year>2021</year>
            </pub-date>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2021 Anantharaman K and Kieft K</copyright-statement>
                <copyright-year>2021</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access peer review report distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <related-article ext-link-type="doi" id="relatedArticleReport91781" related-article-type="peer-reviewed-article" xlink:href="10.12688/f1000research.54449.1"/>
            <custom-meta-group>
                <custom-meta>
                    <meta-name>recommendation</meta-name>
                    <meta-value>reject</meta-value>
                </custom-meta>
            </custom-meta-group>
        </front-stub>
        <body>
            <p>This manuscript by Roach
                <italic> et al. </italic>describes the creation and benchmarking of a gold standard bacterial dataset that can be used for prediction of prophages from bacterial genomes. Additionally, they also benchmark seven currently available software for prediction of prophages. Overall, this manuscript and the datasets provided represent a valuable resource to the community that can be used widely. We do have some comments that in our opinion can improve the manuscript, the benchmarking and the utility of the gold standard dataset that the authors aim to to provide to the community.</p>
            <p> </p>
            <p> </p>
            <p> 
                <bold>Introduction:&#x00a0;</bold> 
                <list list-type="bullet">
                    <list-item>
                        <p>
                            <italic>Last paragraph</italic>: the reasoning for this study is sound and accurate. Though the usage of the term &#x201c;annotated&#x201d; is slightly ambiguous here, and throughout the paper, because it is meant to designate either prophage locations or protein/gene annotations.</p>
                    </list-item>
                </list> </p>
            <p> 
                <bold>Methods:</bold>
            </p>
            <p> </p>
            <p> 
                <italic>First sentence</italic>: the actual method of &#x201c;manually curated prophage annotations was generated&#x201d; is never explained. 
                <list list-type="bullet">
                    <list-item>
                        <p>What method was used? How were prophages manually identified, annotated, and validated? To me, gold standard would imply each prophage has been experimentally validated.</p>
                    </list-item>
                    <list-item>
                        <p>Was there is specific method by which certain hosts were selected? I can see that there is &#x201c;Escherichia_coli_O157-H7&#x201d; and &#x201c;Escherichia_coli_O157-H7_EDL933&#x201d;. Why were so similar hosts chosen? Do they have significantly different prophages? There are multiple examples of this.</p>
                    </list-item>
                    <list-item>
                        <p>Many also appear to be common model organisms. How was diversity ensured? Is there a possibility to use organisms more widely distributed across the tree of life?</p>
                    </list-item>
                    <list-item>
                        <p>If this component is at all incorrect then the performance metrics, especially false positives if the prophage boundaries are wrong, will be biased.</p>
                    </list-item>
                    <list-item>
                        <p>How was Supplemental Table 2 generated?</p>
                    </list-item>
                </list> Overall, there is no indication as to how the gold standard dataset, the centerpiece of the paper, was actually generated. This does not significantly affect the study&#x2019;s results, but this information needs to be included before publication. For example, were the host sequences chosen at random from a database? Represent variable phylogenetic backgrounds? Source environments? Was prophage phylogeny taken into account? There are certainly questions left unanswered.&#x00a0;</p>
            <p> </p>
            <p> </p>
            <p> 
                <bold>Results:</bold> 
                <list list-type="bullet">
                    <list-item>
                        <p>
                            <italic>Prophage prediction performance</italic>: rather than only providing subjective &#x201c;best&#x201d; and &#x201c;worst&#x201d; designations, the numerical results should be provided too (e.g., accuracy of 0.9 +/- 0.1). Furthermore, what statistical metrics were used to designate &#x201c;best&#x201d; and &#x201c;worst&#x201d;?</p>
                    </list-item>
                    <list-item>
                        <p>
                            <italic>Caveats</italic>: The VIBRANT manuscript says that it also was developed to identify both temperate and virulent viral regions in metagenomes. FYI - we were not able to access the Supplementary datasets through the paper (but were able to retrieve them from bioRxiv).</p>
                    </list-item>
                </list> 
                <bold>Suggestions:</bold>
            </p>
            <p> </p>
            <p> Overall, this comparison framework would benefit from simple, minor additions. 
                <list list-type="bullet">
                    <list-item>
                        <p>Does the specific host (e.g., taxonomy) affect the results of prophage prediction for some tools? For tools that utilize HMM searches, the HMM databases may be biased towards certain groups (e.g., 
                            <italic>E. coli</italic> phages). We suggest that a comparison of precision/recall be compared to the source host.</p>
                    </list-item>
                    <list-item>
                        <p>Do the performance comparisons only take into account total prophage CDS predictions or also the completeness of predicted prophages? For example, identifying all prophages but only 50% of each of those prophages is different than identifying half of all prophages but 100% of each of those.</p>
                    </list-item>
                    <list-item>
                        <p>Is there any effect on hosts with multiple prophages? Are some tools affected by this?</p>
                    </list-item>
                    <list-item>
                        <p>Some tools will have predicted prophages that were not in the gold standard set (false positives). What measures were taken to ensure that none of these are real prophages that were missed within the manual curation?</p>
                    </list-item>
                </list>
            </p>
            <p>Is the work clearly and accurately presented and does it cite the current literature?</p>
            <p>Yes</p>
            <p>If applicable, is the statistical analysis and its interpretation appropriate?</p>
            <p>Yes</p>
            <p>Are all the source data underlying the results available to ensure full reproducibility?</p>
            <p>Yes</p>
            <p>Is the study design appropriate and is the work technically sound?</p>
            <p>Partly</p>
            <p>Are the conclusions drawn adequately supported by the results?</p>
            <p>Yes</p>
            <p>Are sufficient details of methods and analysis provided to allow replication by others?</p>
            <p>Partly</p>
            <p>Reviewer Expertise:</p>
            <p>Metagenomics, Microbial and Phage ecology</p>
            <p>We confirm that we have read this submission and believe that we have an appropriate level of expertise to state that we do not consider it to be of an acceptable scientific standard, for reasons outlined above.</p>
        </body>
        <sub-article article-type="response" id="comment8050-91781">
            <front-stub>
                <contrib-group>
                    <contrib contrib-type="author">
                        <name>
                            <surname>Roach</surname>
                            <given-names>Michael</given-names>
                        </name>
                        <aff>Flinders University, Australia</aff>
                    </contrib>
                </contrib-group>
                <author-notes>
                    <fn fn-type="conflict">
                        <p>
                            <bold>Competing interests: </bold>The authors declare that there are no conflicts of interest.</p>
                    </fn>
                </author-notes>
                <pub-date pub-type="epub">
                    <day>5</day>
                    <month>4</month>
                    <year>2022</year>
                </pub-date>
            </front-stub>
            <body>
                <p>Thank you so much for reviewing our manuscript. We hope that version 2 address the concerns with the manuscript which we outline below: 
                    <list list-type="bullet">
                        <list-item>
                            <p>
                                <italic>Last paragraph: the reasoning for this study is sound and accurate. Though the usage of the term &#x201c;annotated&#x201d; is slightly ambiguous here, and throughout the paper, because it is meant to designate either prophage locations or protein/gene annotations.</italic>
                            </p>
                        </list-item>
                        <list-item>
                            <p>
                                <bold>Response:</bold> We agree that this could be clearer. We have updated all instances of &#x2018;annotations&#x2019; in the manuscript to explicitly refer to either prophage or gene annotations.</p>
                        </list-item>
                        <list-item>
                            <p>
                                <italic>Methods:&#x00a0;</italic>
                                <italic>First sentence: the actual method of &#x201c;manually curated prophage annotations was generated&#x201d; is never explained. What method was used? How were prophages manually identified, annotated, and validated? To me, gold standard would imply each prophage has been experimentally validated.</italic>
                            </p>
                        </list-item>
                        <list-item>
                            <p>
                                <bold>Response:</bold> Experimentally validating all prohages by inducing them is not possible currently, as we do not know the signal for triggering the lytic cycles for all the prophages we know about. It is also not possible for elements such as cryptic phages, which may still offer a strong phrophage signal and represent true phage genome sequence, as they are not able to be induced. For cryptic prophages we believe it is still important to include these predictions as prophage annotations. The next best approach to a gold-standard library is to manually inspect and annotate the genomes. We have included the guidelines we use as supplementary material.</p>
                        </list-item>
                        <list-item>
                            <p>
                                <italic>Was there is specific method by which certain hosts were selected? I can see that there is &#x201c;Escherichia_coli_O157-H7&#x201d; and &#x201c;Escherichia_coli_O157-H7_EDL933&#x201d;. Why were so similar hosts chosen? Do they have significantly different prophages? There are multiple examples of this. Many also appear to be common model organisms. How was diversity ensured? Is there a possibility to use organisms more widely distributed across the tree of life?</italic>
                            </p>
                        </list-item>
                        <list-item>
                            <p>
                                <bold>Response:</bold> For PhiSpy&#x2019;s original development it was important to include multiple similar genomes with dissimilar numbers and positions of phages for training the algorithm. This selection bias is something that we have more recently been trying to address. We have earmarked many new diverse genomes for manual curation, and this update marks the inclusion of 10 new prophage annotated genomes from under-represented phyla. There is still a long way to go. Annotating prophages remains an extremely challenging task for underrepresented bacterial phyla, and it will remain so until our knowledgebase of known phages and phage proteins for these phyla improves.</p>
                        </list-item>
                        <list-item>
                            <p>
                                <italic>If this component is at all incorrect then the performance metrics, especially false positives if the prophage boundaries are wrong, will be biased.</italic>
                            </p>
                        </list-item>
                        <list-item>
                            <p>
                                <bold>Response:</bold> The current state is not perfect, rather, it is the best we can do right now. We agree with the sentiment, and it is why we have designed the repository around making it easy to add and refine tools, genomes and prophage annotations over time. However, we don&#x2019;t believe there are enough errors to significantly affect the outcome of the evaluation.</p>
                        </list-item>
                        <list-item>
                            <p>
                                <italic>How was Supplemental Table 2 generated?</italic>
                            </p>
                        </list-item>
                        <list-item>
                            <p>
                                <bold>Response: </bold>It was originally compiled during manual curation. We now include a script for generating this table from the prophage-annotated GenBank files, as well as an updated table to include the new genomes.</p>
                        </list-item>
                        <list-item>
                            <p>
                                <italic>Overall, there is no indication as to how the gold standard dataset, the centerpiece of the paper, was actually generated. This does not significantly affect the study&#x2019;s results, but this information needs to be included before publication. For example, were the host sequences chosen at random from a database? Represent variable phylogenetic backgrounds? Source environments? Was prophage phylogeny taken into account? There are certainly questions left unanswered. </italic>
                            </p>
                        </list-item>
                        <list-item>
                            <p>
                                <bold>Response: </bold>We hope the inclusion of our guidelines for manual curation and our recent progress has alleviated these concerns. There is still a long way to go to achieve a more diverse representation of prophages and this framework is intended to support this journey.</p>
                        </list-item>
                        <list-item>
                            <p>
                                <italic>Results:&#x00a0;</italic>
                                <italic>Prophage prediction performance: rather than only providing subjective &#x201c;best&#x201d; and &#x201c;worst&#x201d; designations, the numerical results should be provided too (e.g., accuracy of 0.9 +/- 0.1). Furthermore, what statistical metrics were used to designate &#x201c;best&#x201d; and &#x201c;worst&#x201d;?</italic>
                            </p>
                        </list-item>
                        <list-item>
                            <p>
                                <bold>Response: </bold>This was partially available in Supp table 3, but given its importance, we have move this to a new table (Table 2) and include a new table (Table 3) for the benchmarking results. We have also calculated and report standard deviations where applicable. &#x201c;Best&#x201d; and &#x201c;Worst&#x201d; are simply designated based on the rankings of each prophage caller based on their scores for a given metric.</p>
                        </list-item>
                        <list-item>
                            <p>
                                <italic>Caveats: The VIBRANT manuscript says that it also was developed to identify both temperate and virulent viral regions in metagenomes. FYI - we were not able to access the Supplementary datasets through the paper (but were able to retrieve them from bioRxiv).</italic>
                            </p>
                        </list-item>
                        <list-item>
                            <p>
                                <bold>Response: </bold>Our apologies. The Genbank files are stored and can be retrieved using git-lfs. The Zenodo repo is a verbatim copy of the GitHub repo and does not resolve the git-lfs links to the GenBank files. We have added a section in underlying data to clarify this. We have also made sure there are instructions in the GitHub readme and genbank subfolder readme for syncing the GenBank files with git-lfs.</p>
                        </list-item>
                        <list-item>
                            <p>
                                <italic>Suggestions:&#x00a0;</italic>
                                <italic>Overall, this comparison framework would benefit from simple, minor additions.&#x00a0;</italic>
                                <italic>Does the specific host (e.g., taxonomy) affect the results of prophage prediction for some tools? For tools that utilize HMM searches, the HMM databases may be biased towards certain groups (e.g., E. coli phages). We suggest that a comparison of precision/recall be compared to the source host.</italic>
                            </p>
                        </list-item>
                        <list-item>
                            <p>
                                <bold>Response:</bold> This is absolutely a consideration for every program and comes back to the problem of selection bias in the database. It&#x2019;s fundamentally not something we can solve in this update of the framework. We compared f1 scores for each tool against genus and the f1 scores of each genus across the population averages (see results and Figure S2a/b).</p>
                        </list-item>
                        <list-item>
                            <p>
                                <italic>Do the performance comparisons only take into account total prophage CDS predictions or also the completeness of predicted prophages? For example, identifying all prophages but only 50% of each of those prophages is different than identifying half of all prophages but 100% of each of those.&#x00a0;</italic>
                            </p>
                        </list-item>
                        <list-item>
                            <p>
                                <bold>Response:</bold> The performance comparisons currently only compare the numbers of correctly labelled genes. If a user were manually curating their predictions, then it could be argued that partially capturing all prophages would be better than completely capturing half of the prophages. This is something we might be able to add in the future if there is enough interest.</p>
                        </list-item>
                        <list-item>
                            <p>
                                <italic>Is there any effect on hosts with multiple prophages? Are some tools affected by this?</italic>
                            </p>
                        </list-item>
                        <list-item>
                            <p>
                                <bold>Response:</bold> The number of prophages shouldn&#x2019;t impact the performance of any of the tools but this is not something we&#x2019;ve looked at specifically. Most genomes only have 1 or a few prophages and it would be difficult to draw any conclusions without more examples at the fringes (0 prophages or say more than 6 or so). It is certainly something to consider as the dataset grows.</p>
                        </list-item>
                        <list-item>
                            <p>
                                <italic>Some tools will have predicted prophages that were not in the gold standard set (false positives). What measures were taken to ensure that none of these are real prophages that were missed within the manual curation?</italic>
                            </p>
                        </list-item>
                        <list-item>
                            <p>
                                <bold>Response: </bold>The genomes are small enough that the entire genomes are thoroughly examined during manual curation. We don&#x2019;t anticipate enough errors to significantly affect the outcome of the evaluation. Nevertheless, we do anticipate that some corrections will need to be made over time, be that from missed prophages or incorrect prophage boundaries and we welcome feedback from the community about the prophage annotations.</p>
                        </list-item>
                    </list>
                </p>
            </body>
        </sub-article>
    </sub-article>
    <sub-article article-type="reviewer-report" id="report91324">
        <front-stub>
            <article-id pub-id-type="doi">10.5256/f1000research.57937.r91324</article-id>
            <title-group>
                <article-title>Reviewer response for version 1</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author">
                    <name>
                        <surname>Nobrega</surname>
                        <given-names>Franklin</given-names>
                    </name>
                    <xref ref-type="aff" rid="r91324a1">1</xref>
                    <role>Referee</role>
                    <uri content-type="orcid">https://orcid.org/0000-0002-8238-1083</uri>
                </contrib>
                <aff id="r91324a1">
                    <label>1</label>School of Biological Sciences, Faculty of Environmental and Life Sciences, University of Southampton, Southampton, UK</aff>
            </contrib-group>
            <author-notes>
                <fn fn-type="conflict">
                    <p>
                        <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>23</day>
                <month>8</month>
                <year>2021</year>
            </pub-date>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2021 Nobrega F</copyright-statement>
                <copyright-year>2021</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access peer review report distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <related-article ext-link-type="doi" id="relatedArticleReport91324" related-article-type="peer-reviewed-article" xlink:href="10.12688/f1000research.54449.1"/>
            <custom-meta-group>
                <custom-meta>
                    <meta-name>recommendation</meta-name>
                    <meta-value>approve-with-reservations</meta-value>
                </custom-meta>
            </custom-meta-group>
        </front-stub>
        <body>
            <p>The manuscript by Roach and co-authors focuses on a crucial question on how to accurately determine prophage regions. With the increasing accessibility of HPC infrastructure by scholars, and the increasing number of open datasets available for mining, there is an urgent need to establish FAIR datasets to set a ground-truth for data analysis. This work sets the tone so the community can move away from using a favourite tool, to using the most accurate and reliable to address the question at hand. In particular, the tool performance part is excellently achieved, providing details for both the novice and the advanced user when considering a new tool for their pipeline. In sum, it was a pleasure to read this well-structured and well-balanced work, which I fully endorse. I would like to leave the authors with a few recommendations and suggestions.</p>
            <p> </p>
            <p> 
                <bold>Recommendations:</bold> 
                <list list-type="order">
                    <list-item>
                        <p>I believe the authors could use a more recent reference for Calendar, 1988 (Introduction).</p>
                    </list-item>
                    <list-item>
                        <p>Please provide the methods used for manual curation of prophage annotations, as this will contribute to increase the gold-standard genomes available.</p>
                    </list-item>
                    <list-item>
                        <p>What was the rationale for running PhiSpy using all modes, and not doing the same for other tools that also have different run modes? This would make for a more fair comparison.</p>
                    </list-item>
                    <list-item>
                        <p>Could the authors clarify which prophage prediction categories were considered for VirSorter and Virsorter2, as these will certainly affect the accuracy and recall results obtained. Similar comment for VIBRANT.</p>
                    </list-item>
                    <list-item>
                        <p>Data would benefit from statistical analysis.</p>
                    </list-item>
                </list> 
                <bold>Suggestions:</bold> 
                <list list-type="order">
                    <list-item>
                        <p>The first three lines of &#x201c;Benchmark metrics&#x201d; (Methods) seem to be more adequate to the Results section.</p>
                    </list-item>
                    <list-item>
                        <p>I would suggest that the authors summarize the information provided in &#x201c;Software compared&#x201d; (Results and discussion) as a supplementary table, since this will certainly be useful to the community.</p>
                    </list-item>
                </list>
            </p>
            <p>Is the work clearly and accurately presented and does it cite the current literature?</p>
            <p>Yes</p>
            <p>If applicable, is the statistical analysis and its interpretation appropriate?</p>
            <p>No</p>
            <p>Are all the source data underlying the results available to ensure full reproducibility?</p>
            <p>Yes</p>
            <p>Is the study design appropriate and is the work technically sound?</p>
            <p>Yes</p>
            <p>Are the conclusions drawn adequately supported by the results?</p>
            <p>Yes</p>
            <p>Are sufficient details of methods and analysis provided to allow replication by others?</p>
            <p>Yes</p>
            <p>Reviewer Expertise:</p>
            <p>Phage biology, phage-host interactions</p>
            <p>I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard, however I have significant reservations, as outlined above.</p>
        </body>
        <sub-article article-type="response" id="comment8049-91324">
            <front-stub>
                <contrib-group>
                    <contrib contrib-type="author">
                        <name>
                            <surname>Roach</surname>
                            <given-names>Michael</given-names>
                        </name>
                        <aff>Flinders University, Australia</aff>
                    </contrib>
                </contrib-group>
                <author-notes>
                    <fn fn-type="conflict">
                        <p>
                            <bold>Competing interests: </bold>The authors declare that there are no conflicts of interest.</p>
                    </fn>
                </author-notes>
                <pub-date pub-type="epub">
                    <day>5</day>
                    <month>4</month>
                    <year>2022</year>
                </pub-date>
            </front-stub>
            <body>
                <p>Thank you so much for reviewing our manuscript. We hope that version 2 addresses the concerns with the manuscript which we outline below: 
                    <list list-type="bullet">
                        <list-item>
                            <p>
                                <italic>I believe the authors could use a more recent reference for Calendar, 1988 (Introduction).</italic>
                            </p>
                        </list-item>
                        <list-item>
                            <p>
                                <bold>Response: </bold>We have updated this section with more recent references.</p>
                        </list-item>
                        <list-item>
                            <p>
                                <italic>Please provide the methods used for manual curation of prophage annotations, as this will contribute to increase the gold-standard genomes available.</italic>
                            </p>
                        </list-item>
                        <list-item>
                            <p>
                                <bold>Response: </bold>Guidelines are now included in additional data.</p>
                        </list-item>
                        <list-item>
                            <p>
                                <italic>What was the rationale for running PhiSpy using all modes, and not doing the same for other tools that also have different run modes? This would make for a more fair comparison.</italic>
                            </p>
                        </list-item>
                        <list-item>
                            <p>
                                <bold>Response: </bold>We developed PhiSpy and are well familiar with the different ways of running the pipeline. To keep the comparison fair, we now only present running PhiSpy with default parameters.</p>
                        </list-item>
                        <list-item>
                            <p>
                                <italic>Could the authors clarify which prophage prediction categories were considered for VirSorter and Virsorter2, as these will certainly affect the accuracy and recall results obtained. Similar comment for VIBRANT.</italic>
                            </p>
                        </list-item>
                        <list-item>
                            <p>
                                <bold>Response:</bold> Following valuable contributions and input from SR&#x2014;now a coauthor on this paper&#x2014;the Virsorter categories 1-5 are taken as prophage predictions. Virsorter2 is run with --high-confidence-only --exclude-lt2gene and we accept both predicted whole phages and integrated phage genomes as prophage predictions. VIBRANT is run with default parameters and we use all predictions from the integrated_prophage_coordinates output file.</p>
                        </list-item>
                        <list-item>
                            <p>
                                <italic>Data would benefit from statistical analysis.</italic>
                            </p>
                        </list-item>
                        <list-item>
                            <p>
                                <bold>Response: </bold>We now include some statistical analysis as part of out database bias evaluation.</p>
                        </list-item>
                        <list-item>
                            <p>
                                <italic>Suggestions:</italic>&#x00a0;
                                <italic>The first three lines of &#x201c;Benchmark metrics&#x201d; (Methods) seem to be more adequate to the Results section.</italic>
                            </p>
                        </list-item>
                        <list-item>
                            <p>
                                <bold>Response: </bold>We agree, the sentence has been moved to the results section.</p>
                        </list-item>
                        <list-item>
                            <p>
                                <italic>I would suggest that the authors summarize the information provided in &#x201c;Software compared&#x201d; (Results and discussion) as a supplementary table, since this will certainly be useful to the community.</italic>
                            </p>
                        </list-item>
                        <list-item>
                            <p>
                                <bold>Response: </bold>We considered adding a more simplified summary table, such as ticks and crosses or 5-start ratings for various features, however these can be very subjective and would simply be our interpretation complete with our personal biases of the results.</p>
                        </list-item>
                    </list>
                </p>
            </body>
        </sub-article>
    </sub-article>
</article>
