<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.2 20190208//EN" "http://jats.nlm.nih.gov/publishing/1.2/JATS-journalpublishing1.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="brief-report" dtd-version="1.2" xml:lang="en">
    <front>
        <journal-meta>
            <journal-id journal-id-type="pmc">F1000Research</journal-id>
            <journal-title-group>
                <journal-title>F1000Research</journal-title>
            </journal-title-group>
            <issn pub-type="epub">2046-1402</issn>
            <publisher>
                <publisher-name>F1000 Research Limited</publisher-name>
                <publisher-loc>London, UK</publisher-loc>
            </publisher>
        </journal-meta>
        <article-meta>
            <article-id pub-id-type="doi">10.12688/f1000research.72956.2</article-id>
            <article-categories>
                <subj-group subj-group-type="heading">
                    <subject>Brief Report</subject>
                </subj-group>
                <subj-group>
                    <subject>Articles</subject>
                </subj-group>
            </article-categories>
            <title-group>
                <article-title>Differential enrichment of yeast DNA in SARS-CoV-2 and related genomes supports synthetic origin hypothesis</article-title>
                <fn-group content-type="pub-status">
                    <fn>
                        <p>[version 2; peer review: awaiting peer review]</p>
                    </fn>
                </fn-group>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author" corresp="yes">
                    <name>
                        <surname>Lisewski</surname>
                        <given-names>Andreas Martin</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Conceptualization</role>
                    <role content-type="http://credit.niso.org/">Data Curation</role>
                    <role content-type="http://credit.niso.org/">Formal Analysis</role>
                    <role content-type="http://credit.niso.org/">Investigation</role>
                    <role content-type="http://credit.niso.org/">Methodology</role>
                    <role content-type="http://credit.niso.org/">Project Administration</role>
                    <role content-type="http://credit.niso.org/">Supervision</role>
                    <role content-type="http://credit.niso.org/">Validation</role>
                    <role content-type="http://credit.niso.org/">Visualization</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Original Draft Preparation</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <uri content-type="orcid">https://orcid.org/0000-0003-3403-6880</uri>
                    <xref ref-type="corresp" rid="c1">a</xref>
                    <xref ref-type="aff" rid="a1">1</xref>
                </contrib>
                <aff id="a1">
                    <label>1</label>Department of Life Sciences and Chemistry, Jacobs University Bremen, Bremen, 28759, Germany</aff>
            </contrib-group>
            <author-notes>
                <corresp id="c1">
                    <label>a</label>
                    <email xlink:href="mailto:a.lisewski@jacobs-university.de">a.lisewski@jacobs-university.de</email>
                </corresp>
                <fn fn-type="conflict">
                    <p>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>14</day>
                <month>10</month>
                <year>2021</year>
            </pub-date>
            <pub-date pub-type="collection">
                <year>2021</year>
            </pub-date>
            <volume>10</volume>
            <elocation-id>912</elocation-id>
            <history>
                <date date-type="accepted">
                    <day>6</day>
                    <month>10</month>
                    <year>2021</year>
                </date>
            </history>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2021 Lisewski AM</copyright-statement>
                <copyright-year>2021</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access article distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <self-uri content-type="pdf" xlink:href="https://f1000research.com/articles/10-912/pdf"/>
            <abstract>
                <p>
                    <bold>Background:</bold> Knowledge about the origin of SARS-CoV-2 is necessary for both a biological and epidemiological understanding of the COVID-19 pandemic. Evidence suggests that a proximal evolutionary ancestor of SARS-CoV-2 belongs to the bat coronavirus family. However, as further evidence for a direct zoonosis remains limited, alternative modes of SARS-CoV-2 biogenesis should be also considered. </p>
                <p>
                    <bold>Results:</bold> Here we show that the genomes from SARS-CoV-2 and from SARS-CoV-1 are differentially enriched with short chromosomal sequences from the yeast 
                    <italic toggle="yes">S. cerevisiae</italic> at focal positions that are known to be critical for virus replication, host cell invasion, and host immune response. Specifically, for SARS-CoV-2, we identify two sites: one at the start of the viral replicase domain, and the other at the end of the spike gene past its critical domain junction; for SARS-CoV-1, one at the start of the RNA dependent RNA polymerase gene, and the other at the start of the spike protein&#x2019;s receptor binding domain. As yeast is not a natural host for this virus family, we propose a directed passage model for viral constructs, including virus replicase, in yeast cells based on co-transformation of virus DNA plasmids carrying yeast selectable genetic markers followed by intra-chromosomal homologous recombination through gene conversion. Highly differential sequence homology data across yeast chromosomes congruent with chromosomes harboring specific auxotrophic markers further support this passage model. Model and data together allow us to infer a hypothetical tripartite genome assembly scheme for the synthetic biogenesis of SARS-CoV-2 and SARS-CoV-1.</p>
                <p>
                    <bold>Conclusions:</bold> These results provide evidence that the genome sequences of SARS-CoV-1, SARS-CoV-2, but not that of RaTG13, BANAL-20-52 and all other closest SARS coronavirus family members identified, are carriers of distinct homology signals that might point to large-scale genomic editing during a passage of directed replication and chromosomal integration inside genetically modified yeast cells. </p>
            </abstract>
            <kwd-group kwd-group-type="author">
                <kwd>SARS related coronavirus</kwd>
                <kwd>SARS-CoV-2</kwd>
                <kwd>SARS-CoV-1</kwd>
                <kwd>COVID-19</kwd>
                <kwd>virus passage</kwd>
                <kwd>yeast S. cerevisiae</kwd>
                <kwd>directed evolution</kwd>
                <kwd>genomic transformation</kwd>
                <kwd>genome editing</kwd>
                <kwd>synthetic biology</kwd>
            </kwd-group>
            <funding-group>
                <funding-statement>The author(s) declared that no grants were involved in supporting this work.</funding-statement>
            </funding-group>
        </article-meta>
        <notes>
            <sec sec-type="version-changes">
                <label>Updated</label>
                <title>Changes from Version 1</title>
                <p>Minor data changes included (due to recent publication of the BANAL-20-52 virus genome).</p>
            </sec>
        </notes>
    </front>
    <body>
        <sec sec-type="intro">
            <title>Introduction</title>
            <p>From the beginning of the COVID-19 pandemic, in March 2020, evidence was put forward that the outbreak of novel coronavirus SARS-CoV-2 within the human population was most likely a product of natural evolution
                <sup>
                    <xref ref-type="bibr" rid="ref-1">1</xref>
                </sup>. According to this view, COVID-19 is a zoonosis that probably originated from a species of closely related bat coronaviruses
                <sup>
                    <xref ref-type="bibr" rid="ref-2">2</xref>
                </sup>. Prior to a hypothetical spillover event, a recent ancestor to SARS-CoV-2 likely evolved inside bat host cells for many decades
                <sup>
                    <xref ref-type="bibr" rid="ref-3">3</xref>
                </sup>. However, the natural evolution hypothesis of SARS-CoV-2 origin is currently not without considerable limitations: first, the difficulty in characterizing the evolutionary origin of the unusual poly-basic (RRAR) furin cleavage site at the S1/S2 junction of the SARS-COV-2 spike (S) glycoprotein
                <sup>
                    <xref ref-type="bibr" rid="ref-4">4</xref>
                </sup>; second, the discrepancy between an exponentially suppressed tropism of SARS-CoV-2 in 
                <italic toggle="yes">Rhinolophus sinicus</italic> bat cells
                <sup>
                    <xref ref-type="bibr" rid="ref-5">5</xref>
                </sup> and the high susceptibility of SARS-CoV-2 toward cell entry via 
                <italic toggle="yes">Rhinolophus sinicus</italic> angiotensin-converting enzyme 2, its primary entry receptor
                <sup>
                    <xref ref-type="bibr" rid="ref-6">6</xref>
                </sup>; and third, the persistent inability to identify an intermediate ancestral host between human and the horseshoe bat 
                <italic toggle="yes">Rhinolophus affinis</italic>. This species was reported to be the host of coronavirus RaTG13
                <sup>
                    <xref ref-type="bibr" rid="ref-7">7</xref>,
                    <xref ref-type="bibr" rid="ref-8">8</xref>
                </sup>, currently the isolate with the highest sequence similarity to the SARS-CoV-2 genome, which is located on the same phylogenetic branch as 
                <italic toggle="yes">Rhinolophus sinicus</italic> bat coronavirus
                <sup>
                    <xref ref-type="bibr" rid="ref-9">9</xref>
                </sup>. Finding the last animal progenitor host of SARS-CoV-2 has been further complicated by a continued uncertainty about the origin of RaTG13 itself
                <sup>
                    <xref ref-type="bibr" rid="ref-10">10</xref>,
                    <xref ref-type="bibr" rid="ref-11">11</xref>
                </sup>. In contrast to the natural evolution hypothesis for SARS-CoV-2, the above limitations do not necessarily apply to genetic engineering of viral genomes. For example, in the case of SARS coronavirus, it has long been established that introducing a synthetic poly-arginine construct at the furin cleavage site significantly increases the rate of entry into human cells compared with wild-type spike protein
                <sup>
                    <xref ref-type="bibr" rid="ref-12">12</xref>
                </sup>. Also before 2010, after a period of rapid progress in the understanding the relevant host-virus factors
                <sup>
                    <xref ref-type="bibr" rid="ref-13">13</xref>,
                    <xref ref-type="bibr" rid="ref-14">14</xref>
                </sup>,  natural barriers in host range of positive strand RNA viruses were rationally extended, leading to directed viral replication in new species including model organisms that originally were not permissive, such as the yeast 
                <italic toggle="yes">Saccharomyces cerevisiae</italic>
                <sup>
                    <xref ref-type="bibr" rid="ref-15">15</xref>
                </sup>. Accordingly, to transform yeast into a synthetic host for viral replication, the scheme has been to co-express viral RNA dependent RNA polymerase (RdRp) and, if also necessary for replication, additional viral factors on plasmids under the control of auxotrophic yeast selectable markers (YSM)
                <sup>
                    <xref ref-type="bibr" rid="ref-16">16</xref>
                </sup>. These selectable markers are primarily there to direct cell lines into stable expression of desired plasmid DNA, but at the same time may function as entry gates for directed insertion of exogenous genetic material into yeast chromosomes
                <sup>
                    <xref ref-type="bibr" rid="ref-17">17</xref>
                </sup>.  In principle, once the RdRp and required auxiliary factors are selectively and functionally expressed, this approach applies to any replication competent SARS coronavirus RNA, including cloned or 
                <italic toggle="yes">de novo</italic> synthesized genomic parts or even entire genomes, thus facilitating their replication as well as integration into the yeast genome. Our hypothesis is that such a passage would leave behind traces in the genomes of both the virus construct and the synthetic host.</p>
        </sec>
        <sec sec-type="methods">
            <title>Methods</title>
            <p>SARS and SARS-like betacoronavirus whole genome nucleotide sequences were taken from the comprehensive sequence and phylogenetic analyses by Zhou 
                <italic toggle="yes">et al</italic>.
                <sup>
                    <xref ref-type="bibr" rid="ref-18">18</xref>
                </sup> and from Li 
                <italic toggle="yes">et al.</italic>
                <sup>
                    <xref ref-type="bibr" rid="ref-9">9</xref>
                </sup>.  In our study, sequences were selected only if they had a valid 
                <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/genbank/">GenBank</ext-link> accession identifier or an NCBI Reference Sequence (RefSeq) accession identifier, as of 5 June 2021, resulting in the reference set of 13 whole genome virus sequences (see also Extended Data). BLAT whole genome comparative sequence analysis was performed using the 
                <ext-link ext-link-type="uri" xlink:href="https://genome-asia.ucsc.edu/cgi-bin/hgBlat">BLAT</ext-link> public webserver (BLAT, RRID:SCR_011919) with options set 
                <monospace>&#x201c;Genome: Search all&#x201d;</monospace> and 
                <monospace>&#x201c;All results (no minimum matches)&#x201d;</monospace>. Given each one of the corresponding 13 BLAT output tables produced from genomic alignments to the yeast 
                <italic toggle="yes">S. cerevisiae</italic> (Extended data Tables S2 &#x2013; S14), the profiled BLAT score
                <italic toggle="yes">, pS</italic>, was the genome-wide distribution of BLAT scores (output table column [SCORE]) weighted by the corresponding length of the homologous genomic region (output table distance between columns [START] and [END]). The cumulative profiled BLAT score 
                <italic toggle="yes">cS</italic>, which was used as a genome-wide quantitative indicator of yeast (
                <italic toggle="yes">S. cerevisiae</italic>) homology, was the total sum over this distribution. After shifting 
                <italic toggle="yes">cS</italic> by the sample&#x2019;s mean and dividing by its standard deviation, the resulting standardized BLAT 
                <italic toggle="yes">z</italic>-score became then a relative indicator of sequence homology with 
                <italic toggle="yes">S. cerevisiae</italic>. Sequence alignments for cross-validation were produced with 
                <monospace>lalign</monospace> from the 
                <ext-link ext-link-type="uri" xlink:href="https://fasta.bioch.virginia.edu/fasta_www2/fasta_down.shtml">fasta36-36.3.8/bin/lalign36</ext-link> software package (version number 36.3.8) with parameter settings: 
                <monospace>-f -12 -g 0 -E 1</monospace>. This parameter choice followed standard parameters for 
                <monospace>
                    <ext-link ext-link-type="uri" xlink:href="https://www.ebi.ac.uk/Tools/psa/lalign/">LALIGN&#x2013;</ext-link>
                </monospace>.</p>
            <p>Sequence identities were calculated using the 
                <monospace>
                    <ext-link ext-link-type="uri" xlink:href="https://www.ebi.ac.uk/Tools/msa/clustalo/">Clustal Omega</ext-link>
                </monospace> public webserver (RRID:SCR_001591) with standard preset parameters.</p>
        </sec>
        <sec sec-type="results">
            <title>Results</title>
            <p>To interrogate the possibility that a similar passage through yeast cells took place within the family of SARS coronaviruses, we selected eight reference genomes
                <sup>
                    <xref ref-type="bibr" rid="ref-18">18</xref>
                </sup> for further analysis (see Methods): SARS-CoV-2 isolate Wuhan-Hu-1 (GenBank reference 
                <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/nuccore/NC_045512.2/">NC_045512.2</ext-link>), 
                <italic toggle="yes">Rhinolophus affinis</italic> bat
                <italic toggle="yes"/> coronavirus RaTG13 (
                <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/nuccore/MN996532.2/">MN996532.2</ext-link>), 
                <italic toggle="yes">Rhinolophus pusillus</italic> SL-CoV ZXC21 (
                <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/nuccore/MG772934.1">MG772934.1</ext-link>), 
                <italic toggle="yes">Rhinolophus pusillus</italic> SL-CoV ZC45 (
                <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/nuccore/MG772933.1">MG772933.1</ext-link>), 
                <italic toggle="yes">Rhinolophus acuminatus</italic> bat coronavirus RacCS203 (
                <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/nuccore/MW251308.1">MW251308.1</ext-link>), 
                <italic toggle="yes">Rhinolophus cornutus</italic> bat coronavirus Rc-o319 (
                <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/nuccore/LC556375.1">LC556375.1</ext-link>), SARS-CoV Urbani (
                <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/nuccore/AY278741.1">AY278741.1</ext-link>), and MERS-CoV isolate HCoV-EMC/2012 (
                <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/nuccore/NC_019843.3">NC_019843.3</ext-link>). For comparative genomic sequence analysis we used a standard bioinformatics approach with the BLAST-like Alignment Tool (
                <ext-link ext-link-type="uri" xlink:href="http://genome.ucsc.edu/cgi-bin/hgBlat?command=start">BLAT</ext-link>) (BLAT, RRID:SCR_011919)
                <sup>
                    <xref ref-type="bibr" rid="ref-19">19</xref>
                </sup>. Each search from the above set of query sequences against the entire multi-species genome database produced a high number (between 1689 and 5083) of tiles, i.e. perfectly aligned short DNA sequences of length 11. A large majority of these tiles were repeatedly matched on the same two target genomes (out of 107 total; see also Extended data Table S1): SARS-CoV-2 (
                <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/nuccore/NC_045512.2">NC_045512.2</ext-link>), the only coronavirus genome in the database, and 
                <italic toggle="yes">S. cerevisiae</italic> (
                <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/assembly/GCF_000146045.2/">SacCer3/S288c</ext-link>). In these instances, BLAT identified many homologous regions by aggregating multiple tiles (Tables S2&#x2013;S9), and to each homologous region it produced an integer score 
                <italic toggle="yes">S</italic>, which is the number of perfectly matched positions therein. To obtain a genome-wide view of this homology signal we stacked together all homologous regions weighted by their individual alignment scores 
                <italic toggle="yes">S</italic>, which resulted in an accumulated homology profile, 
                <italic toggle="yes">pS</italic> (see Methods and Extended Data Figures S1 and S2). To remove its shortest-scale fluctuations, the profile was smoothed by a centered sliding window filter with window size of 200 nucleotides (
                <italic toggle="yes">nt</italic>). The output of eight genomic profiles (
                <xref ref-type="fig" rid="f1">Figure 1</xref> and Figure S2) were ordered by decreasing sequence identity to SARS-CoV-2.</p>
            <fig fig-type="figure" id="f1" orientation="portrait" position="float">
                <label>Figure 1. </label>
                <caption>
                    <title>Profiled alignment scores (
                        <italic toggle="yes">pS</italic>) from the alignment output to the query input of six SARS-coronavirus related full genome sequences (for SL-ZC45 and SL-ZXC21 profiles, see Figure S2).</title>
                    <p>Alignment scores retrieved only from hits matching 
                        <italic toggle="yes">S. cerevisiae</italic> full genomic sequence assembly SacCer3/S288c. For the corresponding BLAT output, see Table S1, and Table S2&#x2013;S9. Upper left, in parentheses, percent sequence identity of query genome to SARS-CoV-2. Of note, detected yeast homology signals, nucleotide sequence similarity, and geographic location (
                        <italic toggle="yes">region, country</italic>) of first identified isolates do not converge. Abbreviations: nsp3C, non-structural protein 3 C-terminal domain [
                        <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/protein/YP_009724389.1?report=graph&amp;from=2232&amp;to=2762">YP_009724389.1 (2,232..2,762)</ext-link>]; Rbd, receptor binding domain [SARS-CoV-2: 
                        <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/protein/YP_009724390.1?report=graph&amp;from=319&amp;to=541">YP_009724390.1 (319..541)</ext-link>; SARS-CoV-1: 
                        <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/protein/AAP13441.1?report=graph&amp;from=317&amp;to=569">AAP13441.1 (317..569)</ext-link>]; S_S1/S2, spike (S) protein S1/S2 domain cleavage region and the S2 fusion subunit [
                        <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/protein/YP_009724390.1?report=graph&amp;from=543&amp;to=1208">YP_009724390.1 (543..1,208)</ext-link>]; RdRpN, N-terminal region of the RNA dependent RNA polymerase [
                        <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/protein/AAP13442.1?report=graph&amp;from=4383&amp;to=4735">AAP13442.1 (4,383..4,735)</ext-link>].</p>
                </caption>
                <graphic orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/78248/0577e670-5963-41e4-b157-9e1329069991_figure1.gif"/>
            </fig>
            <p>For SARS-CoV-2, two prominent (
                <italic toggle="yes">pS</italic> &gt; 20) peaks indicated highly localized profile scores at levels ~10-fold above the apparent background. A first peak (
                <italic toggle="yes">P</italic>1) reaching a top alignment score of 47 in the narrow genomic interval [7191 
                <italic toggle="yes">nt</italic>..7192 
                <italic toggle="yes">nt</italic>]
                <sub>max</sub>, and a second peak 
                <italic toggle="yes">P</italic>2 over ~18,000 
                <italic toggle="yes">nt</italic> downstream with a score of 36 in the region [25196 
                <italic toggle="yes">nt</italic>..25212 
                <italic toggle="yes">nt</italic>]
                <sub>max</sub> (see, 
                <xref ref-type="fig" rid="f1">Figure 1</xref>). To put these data into an established gene-function context these two maxima, with half-maximum widths 
                <italic toggle="yes">w</italic>
                <sub>1/2 </sub>= 215 
                <italic toggle="yes">nt</italic> and 
                <italic toggle="yes">w</italic>
                <sub>1/2  </sub>= 219 
                <italic toggle="yes">nt</italic>, respectively, were annotated with available information from the closest and most specifically annotated genomic region in RefSeq, the NCBI Reference Sequence database
                <sup>
                    <xref ref-type="bibr" rid="ref-20">20</xref>
                </sup>. Thus 
                <italic toggle="yes">P</italic>1 was closest to the start of the C-terminal domain of non-structural protein 3 (designated nsp3C), which extends over the interval [6962 
                <italic toggle="yes">nt</italic>..8552 
                <italic toggle="yes">nt</italic>]. The C-terminal domain of nsp3 is known to play a critical role in replication due to its direct interaction with nsp4, thereby facilitating virus-induced membrane rearrangement and replication complex formation; conversely, loss of nsp3C-nsp4 interaction abolishes SARS coronavirus replication
                <sup>
                    <xref ref-type="bibr" rid="ref-21">21</xref>
                </sup>. 
                <italic toggle="yes">P</italic>2 was located toward the 3&#x2032; end of the open reading frame of the spike gene. Here it overlapped with the 3&#x2032; end of the stretch that covers both the S1/S2 cleavage region and the S2 fusion subunit of the S protein (S_S1/S2, with interval [23192 
                <italic toggle="yes">nt</italic>..25187 
                <italic toggle="yes">nt</italic>]). The S_S1/S2 domain includes the characteristic furin cleavage site at the S1/S2 junction
                <sup>
                    <xref ref-type="bibr" rid="ref-22">22</xref>
                </sup>.  Cleavage activates the nearby S2 fusion peptide and together they constitute an essential part in SARS-CoV-2 particle-dependent and particle-independent cell entry through fusion of viral and cellular membranes
                <sup>
                    <xref ref-type="bibr" rid="ref-23">23</xref>,
                    <xref ref-type="bibr" rid="ref-24">24</xref>
                </sup>. A similar analysis for the RaTG13 viral genome identified only one isolated peak (
                <italic toggle="yes">P</italic>3) with a maximum profile score of 50 on the interval [9713 
                <italic toggle="yes">nt</italic>..9733 
                <italic toggle="yes">nt</italic>]
                <sub>max</sub>, and with 
                <italic toggle="yes">w</italic>
                <sub>1/2</sub> = 230 
                <italic toggle="yes">nt</italic>. It intersected with the coding region of the C-terminal domain of nsp4 located at [9770 
                <italic toggle="yes">nt</italic>..10046 
                <italic toggle="yes">nt</italic>] (
                <xref ref-type="fig" rid="f1">Figure 1</xref>).</p>
            <p>In the SARS coronavirus Urbani genome (SARS-CoV-1), two additional signals were detected: 
                <italic toggle="yes">P</italic>4 with a maximum score 
                <italic toggle="yes">pS</italic> = 26 at position [13486 
                <italic toggle="yes">nt</italic>..13497 
                <italic toggle="yes">nt</italic>]
                <sub>max</sub> and 
                <italic toggle="yes">w</italic>
                <sub>1/2</sub> = 222 
                <italic toggle="yes">nt</italic>; and a broader second peak, 
                <italic toggle="yes">P</italic>5, with 
                <italic toggle="yes">pS</italic> = 41 at position [22286 
                <italic toggle="yes">nt</italic>..22391 
                <italic toggle="yes">nt</italic>]
                <sub>max</sub> and 
                <italic toggle="yes">w</italic>
                <sub>1/2</sub> = 477 
                <italic toggle="yes">nt. P</italic>4 sharply co-localized with the N-terminus of the RdRp domain at [13414 
                <italic toggle="yes">nt</italic>..14470 
                <italic toggle="yes">nt</italic>]. 
                <italic toggle="yes">P</italic>5 was annotated with the N-terminal part of the spike gene&#x2019;s receptor binding domain (Rbd) located in the interval [22443 
                <italic toggle="yes">nt</italic>..23199 
                <italic toggle="yes">nt</italic>]. In contrast to the five signals identified in these three genomes, an equivalent analysis for the other three (RacCS203, Rc-o319, MERS-CoV) produced only negative results. Their accumulated homology profiles were evenly distributed across the entire genomes consistent with a low random score background from many short spurious matches. As a further specificity control, negative results were obtained (see, Figure S3 and Tables S10&#x2013;S14) after profiling the five most closely SARS-CoV-1 related betacoronavirus isolates from five wild animals (civet, 
                <italic toggle="yes">Paradoxurus hermaphroditus</italic>, 
                <italic toggle="yes">Paguma larvata</italic>, 
                <italic toggle="yes">Aselliscus stoliczkanus</italic>, and 
                <italic toggle="yes">Rhinolophus sinicus</italic>), which together with SARS-CoV-2 occupy the same phylogenetic branch
                <sup>
                    <xref ref-type="bibr" rid="ref-9">9</xref>
                </sup>. These data signature of yeast homology in SARS-CoV-1, SARS-CoV-2 and RaTG13 genomes after calculating standardized 
                <italic toggle="yes">z</italic>-scores (
                <xref ref-type="fig" rid="f2">Figure 2</xref>) from the entire BLAT profiles produced to all 13 of the above sequences (Tables S2&#x2013;S14). This analysis was also extended by including the three recently identified bat SARS-like coronavirus genomes from the same clade as RaTG13 (
                <italic toggle="yes">z</italic> = 4.72), i.e., BANAL-20-52 (
                <italic toggle="yes">z</italic> = 0.36), BANAL-20-103 (z = &#x2013;1.56) and BANAL-20-236 (
                <italic toggle="yes">z</italic> = 0.20), which all produced markedly smaller 
                <italic toggle="yes">z</italic>-scores than SARS-CoV-1 (
                <italic toggle="yes">z</italic> = 9.44) and SARS-CoV-2 (z = 5.47). To cross-validate the detected yeast homology signals in 
                <italic toggle="yes">P</italic>1-
                <italic toggle="yes">P</italic>5, we also used an independent sequence alignment method, LALIGN
                <sup>
                    <xref ref-type="bibr" rid="ref-25">25</xref>
                </sup>, which additionally produced statistics (
                <italic toggle="yes">E</italic>-values) for pairwise alignments. While the peaks 
                <italic toggle="yes">P</italic>1 and 
                <italic toggle="yes">P</italic>2, as well as 
                <italic toggle="yes">P</italic>4 and 
                <italic toggle="yes">P</italic>5, could be positively cross-validated, the 
                <italic toggle="yes">P</italic>3 signal in RaTG13 detected by BLAT did not yield a statistically significant alignment with LALIGN, with its 
                <italic toggle="yes">E</italic>-value reaching above 0.01 (see, Table S16 and Figure S4). Taken together, these highly differential data show that, for SARS-CoV-1 and for SARS-CoV-2, genes known to be critical for viral replication and host cell invasion display localized yeast homology at their flanking regions with limited extensions into the corresponding open reading frames.</p>
            <fig fig-type="figure" id="f2" orientation="portrait" position="float">
                <label>Figure 2. </label>
                <caption>
                    <title>Yeast (
                        <italic toggle="yes">S. cerevisiae</italic>) standardized BLAT 
                        <italic toggle="yes">z</italic>-scores representing the relative homology signal from all alignment scores in thirteen representative SARS-related coronaviruses.</title>
                    <p>BLAT 
                        <italic toggle="yes">z</italic>-scores were calculated using mean and standard deviations from the BLAT outputs (see, Table S2&#x2013;S14 and Methods section). Evolutionary guide tree represents pairwise sequence identities between genomic sequences (see, Table S15). Grey shaded box indicates [&#x2212;1, 1] standard deviation interval.</p>
                </caption>
                <graphic orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/78248/0577e670-5963-41e4-b157-9e1329069991_figure2.gif"/>
            </fig>
            <p>To explain this yeast DNA enrichment pattern, we propose the following artificial passage model (
                <xref ref-type="fig" rid="f3">Figure 3A</xref>): Its starting point is a doubly auxotrophic, synthetic yeast cell line with stable, heterologous expression of viral replicase complex (RdRp, optionally together with auxiliary factors for replication, Aux) from a plasmid under the control of a selectable marker YSM1. A second plasmid carries another auxotrophic yeast selectable marker YSM2, which originates from a different chromosome, and regulates the expression of a non-replicative segment of viral RNA (nrvRNA1). At this point, nrvRNA1 is any uninterrupted DNA segment from a SARS-coronavirus related genome prior to passage. Through homologous recombination, the target yeast chromosome is transformed and nrvRNA1 is integrated
                <sup>
                    <xref ref-type="bibr" rid="ref-17">17</xref>
                </sup> at the chromosomal site of the auxotrophy conferring allele homologous to YSM2. During passage cell growth double stranded DNA breaks occur, and breaks at both ends of nrvRNA1 ends, their flanking regions, and their homologous extensions into YSM2 are repaired preferably by intra-chromosomal gene conversion
                <sup>
                    <xref ref-type="bibr" rid="ref-26">26</xref>
                </sup>, i.e. through a non-crossover homologous recombination, and with the endogenous site as the homologous repair donor (
                <xref ref-type="fig" rid="f3">Figure 3A</xref>).</p>
            <fig fig-type="figure" id="f3" orientation="portrait" position="float">
                <label>Figure 3. </label>
                <caption>
                    <p>(
                        <bold>A</bold>) First stage of passage model in the artificial host 
                        <italic toggle="yes">S. cerevisiae</italic> of a plasmid encoded, non-replicable viral RNA (nrvRNA1) originating from a SARS-CoV related virus. Primary integration of non-homologous nrvRNA1 sequence occurs through homologous recombination (HR) between the auxotrophic plasmid yeast selectable marker YSM1 (grey box) and its chromosomal homolog (striped grey box); higher-order homologous recombination follows on the flanking regions of nrvRNA1 through intra-chromosomal gene-conversion; co-expression of viral replicase complex (RdRp) and other auxiliary viral genes (Aux). Scheme in parts adapted from Compton 
                        <italic toggle="yes">et al</italic>. (1982), and from Alves-Rodrigues 
                        <italic toggle="yes">et al</italic>. (2006). P, yeast promoter; A
                        <sub>
                            <italic toggle="yes">n</italic>
                        </sub>, poly-adenosine sequence. (
                        <bold>B</bold>) Integrated profile scores, 
                        <italic toggle="yes">cS</italic>, from BLAT sequence hits on 
                        <italic toggle="yes">S. cerevisiae</italic> by chromosome number from the same six input sequences as in 
                        <xref ref-type="fig" rid="f1">Figure 1</xref> (purple columns); to calculate 
                        <italic toggle="yes">cS</italic>, a score profile cutoff 
                        <italic toggle="yes">pS</italic> &gt; 30 was used. Without a cut-off (
                        <italic toggle="yes">pS</italic> &gt; 0), the same order emerged (black horizontal bars, maximum 
                        <italic toggle="yes">pS</italic> score at each chromosome; all other maximum 
                        <italic toggle="yes">pS</italic> scores from the other genomic queries are below, within shaded area). Five common yeast selectable markers are assigned to their chromosomes of origin. (
                        <bold>C</bold>) Procedural second stage scheme for the synthetic biogenesis of SARS-CoV-2 and SARS-CoV-1. For the possible pairings of yeast selectable markers (YSM1, YSM2) matched in (
                        <bold>B</bold>), genome editing of the three segments nrvRNA1, 2, 3 leads to a fully replicable virus (+)sense RNA. Virus (self-)assembly follows via expression of the structural proteins S, E, M, and N from an enhanced plasmid set Aux*. Rz, self-cleaving ribozyme.</p>
                </caption>
                <graphic orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/78248/0577e670-5963-41e4-b157-9e1329069991_figure3.gif"/>
            </fig>
            <p>If we assume that nrvRNA1 itself contains a copy of RdRp (and of Aux), then the above model implies that higher-order integration events
                <sup>
                    <xref ref-type="bibr" rid="ref-17">17</xref>
                </sup> will occur between the YSM1 plasmid and the primary site of integration. In effect, short segments from its YSM1 region will be also integrated into nrvRNA1.  In this case the passage model specifically predicts that during 
                <italic toggle="yes">S. cerevisiae</italic> growth nrvRNA1 will accumulate sequences from exactly two yeast chromosomes, i.e. those two which YSM1 and YSM2 originated from.</p>
            <p>To test this prediction, we produced the score profile 
                <italic toggle="yes">pS</italic>, but this time from the yeast sequence hits on each chromosome. For direct comparison, we then transformed each profile into a single number (
                <italic toggle="yes">cS</italic>), for all 16 chromosomes (mitochondrial chromosome excluded), by calculating the sum of 
                <italic toggle="yes">pS</italic> over the entire chromosome length conditional on the cutoff 
                <italic toggle="yes">pS</italic> &gt; 30. In the case of SARS-CoV-2, this procedure resulted in two distinct peaks at chromosome number II and number XV (
                <xref ref-type="fig" rid="f3">Figure 3B</xref>). For SARS-CoV-1, the highest two peaks were at chromosomes IV and V, followed by a much shallower peak on XVI with only 0.24 the height of IV. One peak was detected for RaTG13, also at XVI, whereas the other three viral genomes produced no signal at the chosen cutoff (see, 
                <xref ref-type="fig" rid="f3">Figure 3B</xref>, also for similar data without a cutoff). To further connect these data to our passage model, we attempted to match the seven most commonly used auxotrophic yeast selectable markers
                <sup>
                    <xref ref-type="bibr" rid="ref-27">27</xref>,
                    <xref ref-type="bibr" rid="ref-28">28</xref>
                </sup> according to their chromosomal origin: ADE2 (adenine requiring 
                <italic toggle="yes">phosphoribosylaminoimidazole carboxylase</italic>, on chromosome XV), HIS3 (histidine requiring 
                <italic toggle="yes">imidazoleglycerol-phosphate dehydratase</italic>, chr. XV), LEU2 (leucine requiring 
                <italic toggle="yes">Beta-isopropylmalate dehydrogenase</italic>, chr. III), LYS2 (lysine requiring 
                <italic toggle="yes">aminoadipate reductase</italic>, chr. II), MET15 (methionine requiring 
                <italic toggle="yes">O-acetyl homoserine-O-acetyl serine sulfhydrylase</italic>, chr. XII), URA3 (uracil requiring 
                <italic toggle="yes">orotidine-5'-phosphate (OMP) decarboxylase</italic>, chr.V), and TRP1 (tryptophan requiring 
                <italic toggle="yes">phosphoribosylanthranilate isomerase</italic>, chr. IV). In agreement with the model prediction, five out the seven markers could be matched to the four highest of the five chromosome peaks detected in SARS-CoV-2 and SARS-CoV-1 (
                <xref ref-type="fig" rid="f3">Figure 3B</xref>). This outcome especially implies that for SARS-CoV-2 the two auxotrophic markers (YSM1, YSM2) could be any pair from the triple (ADE2, HIS3, LYS2), and for SARS-CoV-1 either the pair (LEU2, TRP1) or (TRP1, LEU2). Thus SARS-CoV-2 and SARS-CoV-1 both did, but RaTG13 did not fit into this synthetic passage model.</p>
            <p>These results further allowed us to infer a specific scheme for the synthetic biogenesis of SARS-CoV-2 and SARS-CoV-1 in transformed yeast cells (
                <xref ref-type="fig" rid="f3">Figure 3C</xref>). The idea is to stitch together both outer DNA complements of a chosen viral genome with the inner segment nrvRNA1. For co-transformation and integration, two plasmids are designed that carry the YSM2 selectable marker with either the 5&#x2032;-end (nrvRNA2) or the 3&#x2032;-end (nrvRNA3) of the target virus genome along with some overlap into nrvRNA1 (regions 1&#x2032; and 1&#x2032;&#x2032;, respectively, see 
                <xref ref-type="fig" rid="f3">Figure 3C</xref>). Essential plasmid ingredients are also a transcriptional promoter for nrvRNA2, and a self-cleaving ribozyme (Rz) sequence for the correct 3&#x2032;-end in nrvRNA3
                <sup>
                    <xref ref-type="bibr" rid="ref-15">15</xref>
                </sup>. Once these three non-replicable RNA encoding segments are integrated on the chromosome in the correct order, expression of fully replicable virus (+)RNA begins and replication commences upon co-expression of the viral replicase complex (RdRp and Aux, controlled through the auxotrophic marker YSM1). The final step, assembly into a fully infectious viral particle, is conveniently achieved with a yeast virus-like-particle (VLP) expression system for the structural proteins S, E (envelope), M (membrane), and N (nucleocapsid) that can be used in parallel by an extended set of auxiliary proteins, Aux*
                <sup>
                    <xref ref-type="bibr" rid="ref-29">29</xref>
                </sup>. This hypothetical cellular factory may therefore produce the targeted, fully infectious viral particles without itself being infected by the virus produced.</p>
        </sec>
        <sec sec-type="discussion">
            <title>Discussion</title>
            <p>Taken together, our results reveal a highly differential homology signal on SARS-CoV-2 and SARS-CoV-1 genomes, which&#x2014;according to our model&#x2014;points to their history of targeted integration, recombination, and directed viral replication through passage in an artificial 
                <italic toggle="yes">S. cerevisiae</italic> host. This genomic pattern suggests similar synthetic origins of SARS-CoV-1 and SARS-CoV-2, but at the same time robustly excludes all other clade members from this type of synthetic origin. A special case is RaTG13, which in our analysis produced both a simpler pattern and a weaker signal of common genetic history with yeast than the two mutually more similar homology signals found in SARS-CoV-1 and SARS-CoV-2. Yet RaTG13 is claimed to be much closer to SARS-CoV-2 evolutionarily
                <sup>
                    <xref ref-type="bibr" rid="ref-7">7</xref>
                </sup>, i.e. 96% genomic sequence identity to SARS-CoV-2 against 80% between SARS-CoV-1 and the latter. This divergence suggests that if RaTG13 is assumed to be a product of natural evolution then both the sequences of SARS-CoV-1 and SARS-CoV-2 cannot be. Alternatively, the origin of RaTG13 could be artificial
                <sup>
                    <xref ref-type="bibr" rid="ref-11">11</xref>
                </sup>&#x2014;along with SARS-CoV-2 and SARS-CoV-1
                <sup>
                    <xref ref-type="bibr" rid="ref-30">30</xref>
                </sup>, as our results also suggest. In this context, a point of uttermost importance would be the identification of the putative input progenitor SARS-CoV nucleotide sequence that went into passage. For example, it could be a highly pathogenic virus designed for, or naturally adapted to human cells and then selected for a transient artificial passage together with some genetic modifications
                <sup>
                    <xref ref-type="bibr" rid="ref-31">31</xref>
                </sup> of the virus to attenuate its virulence. Then its release back into the human host would likely initiate a rapid succession of complex reversal mutations toward its more pathogenic original structure
                <sup>
                    <xref ref-type="bibr" rid="ref-30">30</xref>,
                    <xref ref-type="bibr" rid="ref-31">31</xref>
                </sup>. Intriguingly, during the first months of the SARS-CoV-2 outbreak, the genomic regions of nsp3 and spike protein had the highest mutational rate within the SARS-CoV-2 genome
                <sup>
                    <xref ref-type="bibr" rid="ref-32">32</xref>
                </sup> which may interfere with the yeast homology signal detected in the present study. During an epidemic, such reversal mutations toward an unidentified artificial genotype would be highly detrimental to most public health countermeasures, including pharmacological interventions and vaccinations. In contrast, through specific guidance of countermeasures such as vaccine development, detailed knowledge about the input progenitor&#x2019;s nucleotide sequence would effectively confer population immunity against the pathogen. Without such specific knowledge, our and further results about the conditions of the yeast artificial passage could offer important directions for SARS-CoV-2 antiviral interventions.</p>
        </sec>
        <sec>
            <title>Data availability</title>
            <p>
                <italic toggle="yes">Associated or additional data</italic>. All data underlying the results are available as part of the article and no additional source data are required.</p>
            <p>
                <italic toggle="yes">Repository-hosted data.</italic> The following sequence data was retrieved from the NCBI GenBank repository:</p>
            <list list-type="bullet">
                <list-item>
                    <label>1. </label>
                    <p>Middle East respiratory syndrome-related coronavirus isolate HCoV-EMC/2012, complete genome (NCBI Reference Sequence: 
                        <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/nuccore/NC_019843.3">NC_019843.3</ext-link>)</p>
                </list-item>
                <list-item>
                    <label>2. </label>
                    <p>Severe acute respiratory syndrome-related coronavirus Rc-o319 RNA, complete genome (GenBank: 
                        <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/nuccore/LC556375.1">LC556375.1</ext-link>)</p>
                </list-item>
                <list-item>
                    <label>3. </label>
                    <p>Bat SARS-like coronavirus isolate As6526, complete genome (GenBank: 
                        <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/nuccore/KY417142.1">KY417142.1</ext-link>)</p>
                </list-item>
                <list-item>
                    <label>4. </label>
                    <p>Bat SARS-like coronavirus isolate Rs4874, complete genome (GenBank: 
                        <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/nuccore/KY417150.1">KY417150.1</ext-link>)</p>
                </list-item>
                <list-item>
                    <label>5. </label>
                    <p>SARS coronavirus Urbani, complete genome (GenBank: 
                        <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/nuccore/AY278741.1">AY278741.1</ext-link>)</p>
                </list-item>
                <list-item>
                    <label>6. </label>
                    <p>SARS coronavirus PC4-13, complete genome (GenBank: 
                        <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/nuccore/AY613948.1">AY613948.1</ext-link>)</p>
                </list-item>
                <list-item>
                    <label>7. </label>
                    <p>SARS coronavirus civet020, complete genome (GenBank: 
                        <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/nuccore/AY572038.1">AY572038.1</ext-link>)</p>
                </list-item>
                <list-item>
                    <label>8. </label>
                    <p>SARS coronavirus HC/SZ/61/03, complete genome (GenBank: 
                        <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/nuccore/AY515512.1">AY515512.1</ext-link>)</p>
                </list-item>
                <list-item>
                    <label>9. </label>
                    <p>Bat SARS-like coronavirus isolate bat-SL-CoVZC45, complete genome (GenBank: 
                        <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/nuccore/MG772933.1">MG772933.1</ext-link>)</p>
                </list-item>
                <list-item>
                    <label>10. </label>
                    <p> Bat SARS-like coronavirus isolate bat-SL-CoVZXC21, complete genome (GenBank: 
                        <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/nuccore/MG772934.1">MG772934.1</ext-link>)</p>
                </list-item>
                <list-item>
                    <label>11. </label>
                    <p> Bat coronavirus RacCS203, complete genome (GenBank: 
                        <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/nuccore/MW251308.1">MW251308.1</ext-link>)</p>
                </list-item>
                <list-item>
                    <label>12. </label>
                    <p> Severe acute respiratory syndrome coronavirus 2 isolate Wuhan-Hu-1, complete genome (GenBank: 
                        <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/nuccore/NC_045512.2">NC_045512.2</ext-link>)</p>
                </list-item>
                <list-item>
                    <label>13. </label>
                    <p> Bat coronavirus RaTG13, complete genome (GenBank: 
                        <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/nuccore/MW251308.1">MN996532.2</ext-link>)</p>
                </list-item>
                <list-item>
                    <label>14. </label>
                    <p>Bat coronavirus isolate BANAL-20-52/Laos/2020 (GenBank: 
                        <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/nuccore/MZ937000.1">MZ937000.1</ext-link>)</p>
                </list-item>
                <list-item>
                    <label>15. </label>
                    <p>Bat coronavirus isolate BANAL-20-103/Laos/2020 (GenBank: 
                        <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/nuccore/MZ937001.1">MZ937001.1</ext-link>)</p>
                </list-item>
                <list-item>
                    <label>16. </label>
                    <p>Bat coronavirus isolate BANAL-20-236/Laos/2020 (GenBank: 
                        <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/nuccore/MZ937003.1">MZ937003.1</ext-link>)</p>
                </list-item>
            </list>
            <sec>
                <title>Extended data</title>
                <p>Harvard Dataverse: Differential enrichment of yeast DNA in SARS-CoV-2 and related genomes supports synthetic origin hypothesis. 
                    <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.7910/DVN/BK8AL6">https://doi.org/10.7910/DVN/BK8AL6</ext-link>
                    <sup>
                        <xref ref-type="bibr" rid="ref-33">33</xref>
                    </sup>.</p>
                <p>This project contains the following extended data files:</p>
                <list list-type="bullet">
                    <list-item>
                        <p>Figure_S1.pdf : Profiled alignment scores (pS) without smoothing filter from the BLAT alignment output to the query input of six SARS-coronavirus related full genome nucleotide sequences.</p>
                    </list-item>
                    <list-item>
                        <p>Figure_S2.pdf : Profiled alignment scores (pS) from the alignment output to the query input of SARS-coronavirus like genome sequences SL-ZC45 and SL-ZXC21.</p>
                    </list-item>
                    <list-item>
                        <p>Figure_S3.pdf : Smoothed profile yeast BLAT alignment scores of five betacoronavirus isolates from five wild animals, closely related to SARS-CoV-1 and SARS-CoV-2, after the phylogenetic analysis of Li 
                            <italic toggle="yes">et al.</italic> (2020): 
                            <italic toggle="yes">Paradoxurus hermaphroditus</italic> (palm civet) SARS coronavirus PC4-13 (GenBank AY613948), Civet SARS coronavirus civet020 (AY572038), 
                            <italic toggle="yes">Paguma larvata</italic> SARS coronavirus HC/SZ/61/03 (AY515512), 
                            <italic toggle="yes">Rhinolophus sinicus</italic> bat SARS-like coronavirus Rs4874 (KY417150), 
                            <italic toggle="yes">Aselliscus stoliczkanus</italic> bat SARS-like coronavirus As6526 (KY417142).</p>
                    </list-item>
                    <list-item>
                        <p>Figure_S4.pdf : Alignment E-values (inverted, 1/E) as profiles across genomes of SARS-CoV-2, RaTG13, and SARS-CoV-1 calculated with the LALIGN local alignment method by using a sliding window approach with window sizes as given in Table S16.</p>
                    </list-item>
                    <list-item>
                        <p>Table_S1.tab: Output from the 
                            <ext-link ext-link-type="uri" xlink:href="https://genome-asia.ucsc.edu/cgi-bin/hgBlat">BLAT web server</ext-link>.</p>
                    </list-item>
                    <list-item>
                        <p>Table_S2.tab: SARS-CoV-2/S. cerevisiae (sacCer3) BLAT results.</p>
                    </list-item>
                    <list-item>
                        <p>Table_S3.tab: RaTG13/S. cerevisiae (sacCer3) BLAT results.</p>
                    </list-item>
                    <list-item>
                        <p>Table_S4.tab: RacCS203/S. cerevisiae (sacCer3) BLAT results.</p>
                    </list-item>
                    <list-item>
                        <p>Table_S5.tab: SL-CoV_ZC45/S. cerevisiae (sacCer3) BLAT results.</p>
                    </list-item>
                    <list-item>
                        <p>Table_S6.tab: SL-CoV ZXC21/S. cerevisiae (sacCer3) BLAT results.</p>
                    </list-item>
                    <list-item>
                        <p>Table_S7.tab: Rc-o319/S. cerevisiae (sacCer3) BLAT results.</p>
                    </list-item>
                    <list-item>
                        <p>Table_S8.tab: SARS-CoV-1 Urbani/S. cerevisiae (sacCer3) BLAT results.</p>
                    </list-item>
                    <list-item>
                        <p>Table_S9.tab: MERS-CoV/S. cerevisiae (sacCer3) BLAT results.</p>
                    </list-item>
                    <list-item>
                        <p>Table_S10.tab: SARS coronavirus PC4-13/S. cerevisiae (sacCer3) BLAT results.</p>
                    </list-item>
                    <list-item>
                        <p>Table_S11.tab: SARS coronavirus civet020/S. cerevisiae (sacCer3) BLAT results.</p>
                    </list-item>
                    <list-item>
                        <p>Table_S12.tab: SARS coronavirus HC/SZ/61/03/S. cerevisiae (sacCer3) BLAT results.</p>
                    </list-item>
                    <list-item>
                        <p>Table_S13.tab: SARS-like coronavirus isolate Rs4874 /S. cerevisiae (sacCer3) BLAT results.</p>
                    </list-item>
                    <list-item>
                        <p>Table_S14.tab: SARS-like coronavirus isolate As6526/S. cerevisiae (sacCer3) BLAT results.</p>
                    </list-item>
                    <list-item>
                        <p>Table_S15.tab: Percent identity matrix (Clustal 2.1).</p>
                    </list-item>
                    <list-item>
                        <p>Table_S16.tab: Peak P1-P5 yeast homology signals detected by BLAT, and cross-validated by the LALIGN method.</p>
                    </list-item>
                </list>
            </sec>
        </sec>
    </body>
    <back>
        <ref-list>
            <ref id="ref-1">
                <label>1</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Andersen</surname>
                            <given-names>KG</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Rambaut</surname>
                            <given-names>A</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Lipkin</surname>
                            <given-names>WI</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>The proximal origin of SARS-CoV-2.</article-title>
                    <source>

                        <italic toggle="yes">Nat Med.</italic>
</source>
                    <year>2020</year>;<volume>26</volume>(<issue>4</issue>):<fpage>450</fpage>&#x2013;<lpage>2</lpage>.
                    <pub-id pub-id-type="pmid">32284615</pub-id>
                    <pub-id pub-id-type="doi">10.1038/s41591-020-0820-9</pub-id>
                    <pub-id pub-id-type="pmcid">7095063</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-2">
                <label>2</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>MacLean</surname>
                            <given-names>OA</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Lytras</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Weaver</surname>
                            <given-names>S</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Natural selection in the evolution of SARS-CoV-2 in bats created a generalist virus and highly capable human pathogen.</article-title>
                    <source>

                        <italic toggle="yes">PLoS Biol.</italic>
</source>
                    <year>2021</year>;<volume>19</volume>(<issue>3</issue>):<fpage>e3001115</fpage>.
                    <pub-id pub-id-type="pmid">33711012</pub-id>
                    <pub-id pub-id-type="doi">10.1371/journal.pbio.3001115</pub-id>
                    <pub-id pub-id-type="pmcid">7990310</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-3">
                <label>3</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Boni</surname>
                            <given-names>MF</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Lemey</surname>
                            <given-names>P</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Jiang</surname>
                            <given-names>X</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Evolutionary origins of the SARS-CoV-2 sarbecovirus lineage responsible for the COVID-19 pandemic.</article-title>
                    <source>

                        <italic toggle="yes">Nat Microbiol.</italic>
</source>
                    <year>2020</year>;<volume>5</volume>(<issue>11</issue>):<fpage>1408</fpage>&#x2013;<lpage>17</lpage>.
                    <pub-id pub-id-type="pmid">32724171</pub-id>
                    <pub-id pub-id-type="doi">10.1038/s41564-020-0771-4</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-4">
                <label>4</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Gallaher</surname>
                            <given-names>WR</given-names>
                        </name>
</person-group>:
                    <article-title>A palindromic RNA sequence as a common breakpoint contributor to copy-choice recombination in SARS-COV-2.</article-title>
                    <source>

                        <italic toggle="yes">Arch Virol.</italic>
</source>
                    <year>2020</year>;<volume>65</volume>(<issue>10</issue>):<fpage>2341</fpage>&#x2013;<lpage>2348</lpage>.
                    <pub-id pub-id-type="pmid">32737584</pub-id>
                    <pub-id pub-id-type="doi">10.1007/s00705-020-04750-z</pub-id>
                    <pub-id pub-id-type="pmcid">7394270</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-5">
                <label>5</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Lau</surname>
                            <given-names>SKP</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Wong</surname>
                            <given-names>ACP</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Luk</surname>
                            <given-names>HKH</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Differential Tropism of SARS-CoV and SARS-CoV-2 in Bat Cells.</article-title>
                    <source>

                        <italic toggle="yes">Emerg Infect Dis.</italic>
</source>
                    <year>2020</year>;<volume>26</volume>(<issue>12</issue>):<fpage>2961</fpage>&#x2013;<lpage>5</lpage>.
                    <pub-id pub-id-type="pmid">32730733</pub-id>
                    <pub-id pub-id-type="doi">10.3201/eid2612.202308</pub-id>
                    <pub-id pub-id-type="pmcid">7706959</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-6">
                <label>6</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Zhang</surname>
                            <given-names>HL</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Li</surname>
                            <given-names>YM</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Sun</surname>
                            <given-names>J</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Evaluating angiotensin-converting enzyme 2-mediated SARS-CoV-2 entry across species.</article-title>
                    <source>

                        <italic toggle="yes">J Biol Chem.</italic>
</source>
                    <year>2021</year>;<volume>296</volume>:<fpage>100435</fpage>.
                    <pub-id pub-id-type="pmid">33610551</pub-id>
                    <pub-id pub-id-type="doi">10.1016/j.jbc.2021.100435</pub-id>
                    <pub-id pub-id-type="pmcid">7892319</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-7">
                <label>7</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Zhou</surname>
                            <given-names>P</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Yang</surname>
                            <given-names>XL</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Wang</surname>
                            <given-names>XG</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>A pneumonia outbreak associated with a new coronavirus of probable bat origin.</article-title>
                    <source>

                        <italic toggle="yes">Nature.</italic>
</source>
                    <year>2020</year>;<volume>579</volume>(<issue>7798</issue>):<fpage>270</fpage>&#x2013;<lpage>3</lpage>.
                    <pub-id pub-id-type="pmid">32015507</pub-id>
                    <pub-id pub-id-type="doi">10.1038/s41586-020-2012-7</pub-id>
                    <pub-id pub-id-type="pmcid">7095418</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-8">
                <label>8</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Zhou</surname>
                            <given-names>P</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Yang</surname>
                            <given-names>XL</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Wang</surname>
                            <given-names>XG</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Addendum: A pneumonia outbreak associated with a new coronavirus of probable bat origin.</article-title>
                    <source>

                        <italic toggle="yes">Nature.</italic>
</source>
                    <year>2020</year>;<volume>588</volume>(<issue>7836</issue>):<fpage>E6</fpage>.
                    <pub-id pub-id-type="pmid">33199918</pub-id>
                    <pub-id pub-id-type="doi">10.1038/s41586-020-2951-z</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-9">
                <label>9</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Li</surname>
                            <given-names>C</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Yang</surname>
                            <given-names>Y</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Ren</surname>
                            <given-names>L</given-names>
                        </name>
</person-group>:
                    <article-title>Genetic evolution analysis of 2019 novel coronavirus and coronavirus from other species.</article-title>
                    <source>

                        <italic toggle="yes">Infect Genet Evol.</italic>
</source>
                    <year>2020</year>;<volume>82</volume>:<fpage>104285</fpage>.
                    <pub-id pub-id-type="pmid">32169673</pub-id>
                    <pub-id pub-id-type="doi">10.1016/j.meegid.2020.104285</pub-id>
                    <pub-id pub-id-type="pmcid">7270525</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-10">
                <label>10</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Sallard</surname>
                            <given-names>E</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Halloy</surname>
                            <given-names>J</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Casane</surname>
                            <given-names>D</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Tracing the origins of SARS-COV-2 in coronavirus phylogenies: a review.</article-title>
                    <source>

                        <italic toggle="yes">Environ Chem Lett.</italic>
</source>
                    <year>2021</year>;<fpage>1</fpage>&#x2013;<lpage>17</lpage>.
                    <pub-id pub-id-type="pmid">33558807</pub-id>
                    <pub-id pub-id-type="doi">10.1007/s10311-020-01151-1</pub-id>
                    <pub-id pub-id-type="pmcid">7859469</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-11">
                <label>11</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Deigin</surname>
                            <given-names>Y</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Segreto</surname>
                            <given-names>R</given-names>
                        </name>
</person-group>:
                    <article-title>SARS-CoV-2&#x2019;s claimed natural origin is undermined by issues with genome sequences of its relative strains: Coronavirus sequences RaTG13, MP789 and RmYN02 raise multiple questions to be critically addressed by the scientific community.</article-title>
                    <source>

                        <italic toggle="yes">Bioessays.</italic>
</source>
                    <year>2021</year>;<volume>43</volume>(<issue>7</issue>):<fpage>e2100015</fpage>.
                    <pub-id pub-id-type="pmid">34046923</pub-id>
                    <pub-id pub-id-type="doi">10.1002/bies.202100015</pub-id>
                    <pub-id pub-id-type="pmcid">8209872</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-12">
                <label>12</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Belouzard</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Chu</surname>
                            <given-names>VC</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Whittaker</surname>
                            <given-names>GR</given-names>
                        </name>
</person-group>:
                    <article-title>Activation of the SARS coronavirus spike protein via sequential proteolytic cleavage at two distinct sites.</article-title>
                    <source>

                        <italic toggle="yes">Proc Natl Acad Sci U S A.</italic>
</source>
                    <year>2009</year>;<volume>106</volume>(<issue>14</issue>):<fpage>5871</fpage>&#x2013;<lpage>6</lpage>.
                    <pub-id pub-id-type="pmid">19321428</pub-id>
                    <pub-id pub-id-type="doi">10.1073/pnas.0809524106</pub-id>
                    <pub-id pub-id-type="pmcid">2660061</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-13">
                <label>13</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Kushner</surname>
                            <given-names>DB</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Lindenbach</surname>
                            <given-names>BD</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Grdzelishvili</surname>
                            <given-names>VZ</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Systematic, genome-wide identification of host genes affecting replication of a positive-strand RNA virus.</article-title>
                    <source>

                        <italic toggle="yes">Proc Natl Acad Sci U S A.</italic>
</source>
                    <year>2003</year>;<volume>100</volume>(<issue>26</issue>):<fpage>15764</fpage>&#x2013;<lpage>9</lpage>.
                    <pub-id pub-id-type="pmid">14671320</pub-id>
                    <pub-id pub-id-type="doi">10.1073/pnas.2536857100</pub-id>
                    <pub-id pub-id-type="pmcid">307642</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-14">
                <label>14</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Ahlquist</surname>
                            <given-names>P</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Noueiry</surname>
                            <given-names>AO</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Lee</surname>
                            <given-names>WM</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Host Factors in Positive-Strand RNA Virus Genome Replication.</article-title>
                    <source>

                        <italic toggle="yes">J Virol.</italic>
</source>
                    <year>2003</year>;<volume>77</volume>(<issue>15</issue>):<fpage>8181</fpage>&#x2013;<lpage>6</lpage>.
                    <pub-id pub-id-type="pmid">12857886</pub-id>
                    <pub-id pub-id-type="doi">10.1128/jvi.77.15.8181-8186.2003</pub-id>
                    <pub-id pub-id-type="pmcid">165243</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-15">
                <label>15</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Alves-Rodrigues</surname>
                            <given-names>I</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Gal&#x00e3;o</surname>
                            <given-names>RP</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Meyerhans</surname>
                            <given-names>A</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>
                        <italic toggle="yes">Saccharomyces cerevisiae</italic>: A useful model host to study fundamental biology of viral replication.</article-title>
                    <source>

                        <italic toggle="yes">Virus Res.</italic>
</source>
                    <year>2006</year>;<volume>120</volume>(<issue>1&#x2013;2</issue>):<fpage>49</fpage>&#x2013;<lpage>56</lpage>.
                    <pub-id pub-id-type="pmid">16698107</pub-id>
                    <pub-id pub-id-type="doi">10.1016/j.virusres.2005.11.018</pub-id>
                    <pub-id pub-id-type="pmcid">7114155</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-16">
                <label>16</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Pogany</surname>
                            <given-names>J</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Panavas</surname>
                            <given-names>T</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Serviene</surname>
                            <given-names>E</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>A high-throughput approach for studying virus replication in yeast.</article-title>
                    <source>

                        <italic toggle="yes">Curr Protoc Microbiol.</italic>
</source>
                    <year>2010</year>; Chapter 16:Unit16J.1.
                    <pub-id pub-id-type="pmid">21053256</pub-id>
                    <pub-id pub-id-type="doi">10.1002/9780471729259.mc16j01s19</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-17">
                <label>17</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Compton</surname>
                            <given-names>JL</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Zamir</surname>
                            <given-names>A</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Szalay</surname>
                            <given-names>AA</given-names>
                        </name>
</person-group>:
                    <article-title>Insertion of nonhomologous DNA into the yeast genome mediated by homologous recombination with a cotransforming plasmid.</article-title>
                    <source>

                        <italic toggle="yes">Mol Gen Genet.</italic>
</source>
                    <year>1982</year>;<volume>188</volume>(<issue>1</issue>):<fpage>44</fpage>&#x2013;<lpage>50</lpage>.
                    <pub-id pub-id-type="pmid">6294480</pub-id>
                    <pub-id pub-id-type="doi">10.1007/BF00332994</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-18">
                <label>18</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Zhou</surname>
                            <given-names>H</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Ji</surname>
                            <given-names>J</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Chen</surname>
                            <given-names>X</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Identification of novel bat coronaviruses sheds light on the evolutionary origins of SARS-CoV-2 and related viruses.</article-title>
                    <source>

                        <italic toggle="yes">Cell.</italic>
</source>
                    <year>2021</year>;<volume>184</volume>(<issue>17</issue>):<fpage>4380</fpage>&#x2013;<lpage>4391.e14</lpage>.
                    <pub-id pub-id-type="pmid">34147139</pub-id>
                    <pub-id pub-id-type="doi">10.1016/j.cell.2021.06.008</pub-id>
                    <pub-id pub-id-type="pmcid">8188299</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-19">
                <label>19</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Kent</surname>
                            <given-names>WJ</given-names>
                        </name>
</person-group>:
                    <article-title>BLAT--The BLAST-Like Alignment Tool.</article-title>
                    <source>

                        <italic toggle="yes">Genome Res.</italic>
</source>
                    <year>2002</year>;<volume>12</volume>(<issue>4</issue>):<fpage>656</fpage>&#x2013;<lpage>64</lpage>.
                    <pub-id pub-id-type="pmid">11932250</pub-id>
                    <pub-id pub-id-type="doi">10.1101/gr.229202</pub-id>
                    <pub-id pub-id-type="pmcid">187518</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-20">
                <label>20</label>
                <mixed-citation publication-type="journal">
                    <article-title>National Center for Biotechnology Information (NCBI)</article-title>. Bethesda (MD): National Library of Medicine (US), National Center for Biotechnology Information.<year>1988</year>.
                    <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref-21">
                <label>21</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Sakai</surname>
                            <given-names>Y</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Kawachi</surname>
                            <given-names>K</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Terada</surname>
                            <given-names>Y</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Two-amino acids change in the nsp4 of SARS coronavirus abolishes viral replication.</article-title>
                    <source>

                        <italic toggle="yes">Virology.</italic>
</source>
                    <year>2017</year>;<volume>510</volume>:<fpage>165</fpage>&#x2013;<lpage>74</lpage>.
                    <pub-id pub-id-type="pmid">28738245</pub-id>
                    <pub-id pub-id-type="doi">10.1016/j.virol.2017.07.019</pub-id>
                    <pub-id pub-id-type="pmcid">7111695</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-22">
                <label>22</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Coutard</surname>
                            <given-names>B</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Valle</surname>
                            <given-names>C</given-names>
                        </name>

                        <name name-style="western">
                            <surname>de Lamballerie</surname>
                            <given-names>X</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>The spike glycoprotein of the new coronavirus 2019-nCoV contains a furin-like cleavage site absent in CoV of the same clade.</article-title>
                    <source>

                        <italic toggle="yes">Antiviral Res.</italic>
</source>
                    <year>2020</year>;<volume>176</volume>:<fpage>104742</fpage>.
                    <pub-id pub-id-type="pmid">32057769</pub-id>
                    <pub-id pub-id-type="doi">10.1016/j.antiviral.2020.104742</pub-id>
                    <pub-id pub-id-type="pmcid">7114094</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-23">
                <label>23</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Papa</surname>
                            <given-names>G</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Mallery</surname>
                            <given-names>DL</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Albecka</surname>
                            <given-names>A</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Furin cleavage of SARS-CoV-2 Spike promotes but is not essential for infection and cell-cell fusion.</article-title>
                    <source>

                        <italic toggle="yes">PLoS Pathog.</italic>
</source>
                    <year>2021</year>;<volume>17</volume>(<issue>1</issue>):<fpage>e1009246</fpage>.
                    <pub-id pub-id-type="pmid">33493182</pub-id>
                    <pub-id pub-id-type="doi">10.1371/journal.ppat.1009246</pub-id>
                    <pub-id pub-id-type="pmcid">7861537</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-24">
                <label>24</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Theuerkauf</surname>
                            <given-names>SA</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Michels</surname>
                            <given-names>A</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Riechert</surname>
                            <given-names>V</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Quantitative assays reveal cell fusion at minimal levels of SARS-CoV-2 spike protein and fusion from without.</article-title>
                    <source>

                        <italic toggle="yes">iScience.</italic>
</source>
                    <year>2021</year>;<volume>24</volume>(<issue>3</issue>):<fpage>102170</fpage>.
                    <pub-id pub-id-type="pmid">33585805</pub-id>
                    <pub-id pub-id-type="doi">10.1016/j.isci.2021.102170</pub-id>
                    <pub-id pub-id-type="pmcid">7871100</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-25">
                <label>25</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Huang</surname>
                            <given-names>X</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Miller</surname>
                            <given-names>W</given-names>
                        </name>
</person-group>:
                    <article-title>A time-efficient, linear-space local similarity algorithm.</article-title>
                    <source>

                        <italic toggle="yes">Adv Appl Math.</italic>
</source>
                    <year>1991</year>;<volume>12</volume>(<issue>3</issue>):<fpage>337</fpage>&#x2013;<lpage>57</lpage>.
                    <pub-id pub-id-type="doi">10.1016/0196-8858(91)90017-D</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-26">
                <label>26</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Agmon</surname>
                            <given-names>N</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Pur</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Liefshitz</surname>
                            <given-names>B</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Analysis of repair mechanism choice during homologous recombination.</article-title>
                    <source>

                        <italic toggle="yes">Nucleic Acids Res.</italic>
</source>
                    <year>2009</year>;<volume>37</volume>(<issue>15</issue>):<fpage>5081</fpage>&#x2013;<lpage>92</lpage>.
                    <pub-id pub-id-type="pmid">19553188</pub-id>
                    <pub-id pub-id-type="doi">10.1093/nar/gkp495</pub-id>
                    <pub-id pub-id-type="pmcid">2731894</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-27">
                <label>27</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Pronk</surname>
                            <given-names>JT</given-names>
                        </name>
</person-group>:
                    <article-title>Auxotrophic yeast strains in fundamental and applied research.</article-title>
                    <source>

                        <italic toggle="yes">Appl Environ Microbiol.</italic>
</source>
                    <year>2002</year>;<volume>68</volume>(<issue>5</issue>):<fpage>2095</fpage>&#x2013;<lpage>100</lpage>.
                    <pub-id pub-id-type="pmid">11976076</pub-id>
                    <pub-id pub-id-type="doi">10.1128/AEM.68.5.2095-2100.2002</pub-id>
                    <pub-id pub-id-type="pmcid">127579</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-28">
                <label>28</label>
                <mixed-citation publication-type="journal">
                    <article-title>Commonly used auxotrophic markers. </article-title>SGD-Wiki. [cited 2021 Jun 3].
                    <ext-link ext-link-type="uri" xlink:href="https://wiki.yeastgenome.org/index.php/Commonly_used_auxotrophic_markers">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref-29">
                <label>29</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Nooraei</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Bahrulolum</surname>
                            <given-names>H</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Hoseini</surname>
                            <given-names>ZS</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Virus-like particles: preparation, immunogenicity and their roles as nanovaccines and drug nanocarriers.</article-title>
                    <source>

                        <italic toggle="yes">J Nanobiotechnology.</italic>
</source>
                    <year>2021</year>;<volume>19</volume>(<issue>1</issue>):<fpage>59</fpage>.
                    <pub-id pub-id-type="pmid">33632278</pub-id>
                    <pub-id pub-id-type="doi">10.1186/s12951-021-00806-7</pub-id>
                    <pub-id pub-id-type="pmcid">7905985</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-30">
                <label>30</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Xu</surname>
                            <given-names>D</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Sun</surname>
                            <given-names>H</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Su</surname>
                            <given-names>H</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>SARS coronavirus without reservoir originated from an unnatural evolution, experienced the reverse evolution, and finally disappeared in the world.</article-title>
                    <source>

                        <italic toggle="yes">Chin Med J (Engl).</italic>
</source>
                    <year>2014</year>;<volume>127</volume>(<issue>13</issue>):<fpage>2537</fpage>&#x2013;<lpage>42</lpage>.
                    <pub-id pub-id-type="pmid">24985597</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-31">
                <label>31</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Jimenez-Guarde&#x00f1;o</surname>
                            <given-names>JM</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Regla-Nava</surname>
                            <given-names>JA</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Nieto-Torres</surname>
                            <given-names>JL</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Identification of the Mechanisms Causing Reversion to Virulence in an Attenuated SARS-CoV for the Design of a Genetically Stable Vaccine.</article-title>
                    <source>

                        <italic toggle="yes">PLoS Pathog.</italic>
</source>
                    <year>2015</year>;<volume>11</volume>(<issue>10</issue>):<fpage>e1005215</fpage>.
                    <pub-id pub-id-type="pmid">26513244</pub-id>
                    <pub-id pub-id-type="doi">10.1371/journal.ppat.1005215</pub-id>
                    <pub-id pub-id-type="pmcid">4626112</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-32">
                <label>32</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Pereson</surname>
                            <given-names>MJ</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Mojsiejczuk</surname>
                            <given-names>L</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Mart&#x00ed;nez</surname>
                            <given-names>AP</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Phylogenetic analysis of SARS-CoV-2 in the first few months since its emergence.</article-title>
                    <source>

                        <italic toggle="yes">J Med Virol.</italic>
</source>
                    <year>2021</year>;<volume>93</volume>(<issue>3</issue>):<fpage>1722</fpage>&#x2013;<lpage>31</lpage>.
                    <pub-id pub-id-type="pmid">32966646</pub-id>
                    <pub-id pub-id-type="doi">10.1002/jmv.26545</pub-id>
                    <pub-id pub-id-type="pmcid">7537150</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-33">
                <label>33</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Lisewski</surname>
                            <given-names>AM</given-names>
                        </name>
</person-group>:
                    <article-title>Differential enrichment of yeast DNA in SARS-CoV-2 and related genomes supports synthetic origin hypothesis</article-title>. Harvard Dataverse, V1, UNF: 6:BC1twHAk9jEwqcRfghK4Dg== [fileUNF].<year>2021</year>.
                    <ext-link ext-link-type="uri" xlink:href="http://www.doi.org/10.7910/DVN/BK8AL6">http://www.doi.org/10.7910/DVN/BK8AL6</ext-link>
                </mixed-citation>
            </ref>
        </ref-list>
    </back>
</article>
