<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.2 20190208//EN" "http://jats.nlm.nih.gov/publishing/1.2/JATS-journalpublishing1.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="data-paper" dtd-version="1.2" xml:lang="en">
    <front>
        <journal-meta>
            <journal-id journal-id-type="pmc">F1000Research</journal-id>
            <journal-title-group>
                <journal-title>F1000Research</journal-title>
            </journal-title-group>
            <issn pub-type="epub">2046-1402</issn>
            <publisher>
                <publisher-name>F1000 Research Limited</publisher-name>
                <publisher-loc>London, UK</publisher-loc>
            </publisher>
        </journal-meta>
        <article-meta>
            <article-id pub-id-type="doi">10.12688/f1000research.11859.2</article-id>
            <article-categories>
                <subj-group subj-group-type="heading">
                    <subject>Data Note</subject>
                </subj-group>
                <subj-group>
                    <subject>Articles</subject>
                    <subj-group>
                        <subject>Genomics</subject>
                    </subj-group>
                    <subj-group>
                        <subject>Plant Genomes &amp; Evolution</subject>
                    </subj-group>
                </subj-group>
            </article-categories>
            <title-group>
                <article-title>Draft genome sequencing of the sugarcane hybrid SP80-3280</article-title>
                <fn-group content-type="pub-status">
                    <fn>
                        <p>[version 2; peer review: 2 approved]</p>
                    </fn>
                </fn-group>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author" corresp="yes">
                    <name>
                        <surname>Ria&#x00f1;o-Pach&#x00f3;n</surname>
                        <given-names>Diego Mauricio</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Conceptualization</role>
                    <role content-type="http://credit.niso.org/">Formal Analysis</role>
                    <role content-type="http://credit.niso.org/">Methodology</role>
                    <role content-type="http://credit.niso.org/">Resources</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Original Draft Preparation</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <uri content-type="orcid">https://orcid.org/0000-0001-9803-3465</uri>
                    <xref ref-type="corresp" rid="c1">a</xref>
                    <xref ref-type="aff" rid="a1">1</xref>
                    <xref ref-type="aff" rid="a2">2</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Mattiello</surname>
                        <given-names>Lucia</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Conceptualization</role>
                    <role content-type="http://credit.niso.org/">Methodology</role>
                    <role content-type="http://credit.niso.org/">Resources</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <xref ref-type="aff" rid="a2">2</xref>
                    <xref ref-type="aff" rid="a3">3</xref>
                </contrib>
                <aff id="a1">
                    <label>1</label>Current address: Laboratory of Regulatory Systems Biology, Department of Biochemistry, Institute of Chemistry, University of S&#x00e3;o Paulo, S&#x00e3;o Paulo, SP, Brazil</aff>
                <aff id="a2">
                    <label>2</label>Brazilian Bioethanol Science and Technology Laboratory (CTBE), Brazilian Center for Research in Energy and Materials (CNPEM), Campinas, SP, Brazil</aff>
                <aff id="a3">
                    <label>3</label>Current address: Functional Genome Laboratory, Department of Genetics, Evolution and Bioagents, Institute of Biology, State University of Campinas, Campinas, SP, Brazil</aff>
            </contrib-group>
            <author-notes>
                <corresp id="c1">
                    <label>a</label>
                    <email xlink:href="mailto:diriano@gmail.com">diriano@gmail.com</email>
                </corresp>
                <fn fn-type="conflict">
                    <p>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>3</day>
                <month>7</month>
                <year>2017</year>
            </pub-date>
            <pub-date pub-type="collection">
                <year>2017</year>
            </pub-date>
            <volume>6</volume>
            <elocation-id>861</elocation-id>
            <history>
                <date date-type="accepted">
                    <day>29</day>
                    <month>6</month>
                    <year>2017</year>
                </date>
            </history>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2017 Ria&#x00f1;o-Pach&#x00f3;n DM and Mattiello L</copyright-statement>
                <copyright-year>2017</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access article distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <self-uri content-type="pdf" xlink:href="https://f1000research.com/articles/6-861/pdf"/>
            <abstract>
                <p>Sugarcane commercial cultivar SP80-3280 has been used as a model for genomic analyses in Brazil. Here we present a draft genome sequence employing Illumina TruSeq Synthetic Long reads. The dataset is available from NCBI BioProject with accession 
                    <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/bioproject/PRJNA272769">PRJNA272769</ext-link>.</p>
            </abstract>
            <kwd-group kwd-group-type="author">
                <kwd>sugarcane</kwd>
                <kwd>long reads</kwd>
                <kwd>polyploid</kwd>
                <kwd>genomics</kwd>
            </kwd-group>
            <funding-group>
                <award-group id="fund-1">
                    <funding-source>Centro Nacional de Processamento de Alto Desempenho em S&#x00e3;o Paulo</funding-source>
                    <award-id>UNICAMP/FINEP-MCT</award-id>
                </award-group>
                <award-group id="fund-2">
                    <funding-source>Funda&#x00e7;&#x00e3;o de Amparo &#x00e0; Pesquisa do Estado de S&#x00e3;o Paulo</funding-source>
                    <award-id>2012/23345-0</award-id>
                </award-group>
                <award-group id="fund-3">
                    <funding-source>Brazilian Bioethanol Science and Technology Laboratory</funding-source>
                </award-group>
                <funding-statement>This work was supported by institutional funds from CTBE/CNPEM to DMRP and a Funda&#x00e7;&#x00e3;o de Amparo &#x00e0; Pesquisa do Estado de S&#x00e3;o Paulo (FAPESP) grant to LM (2012/23345-0). The research was developed with support from CENAPAD-SP (Centro Nacional de Processamento de Alto Desempenho em S&#x00e3;o Paulo), project UNICAMP/FINEP-MCT.</funding-statement>
                <funding-statement>
                    <italic>The funders had no role in study design, data collection and analysis, decision to publish, or preparation of the manuscript.</italic>
                </funding-statement>
            </funding-group>
        </article-meta>
        <notes>
            <sec sec-type="version-changes">
                <label>Revised</label>
                <title>Amendments from Version 1</title>
                <p>We fixed some spelling mistakes and added information and links about the genome annotation of sugarcane cultivar SP80-3280</p>
            </sec>
        </notes>
    </front>
    <body>
        <sec sec-type="intro">
            <title>Introduction</title>
            <p>Sugarcane is an economically important crop used as source of sugar, ethanol and electricity generation
                <sup>
                    <xref ref-type="bibr" rid="ref-1">1</xref>
                </sup>. Sugarcane has a haploid genome of ~1Gpb, however, modern sugarcane cultivars are polyploids derived from interspecific hybridization between 
                <italic toggle="yes">S. officinarum</italic> L. and 
                <italic toggle="yes">S. spontaneum</italic> L., reaching up to 130 chromosomes distributed among ~12 homo(eo)logous groups
                <sup>
                    <xref ref-type="bibr" rid="ref-2">2</xref>,
                    <xref ref-type="bibr" rid="ref-3">3</xref>
                </sup>, with a total genome size reaching 10Gpb
                <sup>
                    <xref ref-type="bibr" rid="ref-4">4</xref>
                </sup>. Its complex genome structure has hampered genome sequencing, assembly and annotation. Partial genomic sequences are available
                <sup>
                    <xref ref-type="bibr" rid="ref-5">5</xref>&#x2013;
                    <xref ref-type="bibr" rid="ref-8">8</xref>
                </sup>, as well as transcriptome sequences
                <sup>
                    <xref ref-type="bibr" rid="ref-9">9</xref>&#x2013;
                    <xref ref-type="bibr" rid="ref-11">11</xref>
                </sup>, but there are no whole genome assemblies available to date. Here we used the Illumina TruSeq Synthetic Long Read sequencing technology to survey the genome of the polyploid cultivar SP80-3280. The generated long reads, their assembly and genome annotation have been made public and will provide useful information for functional genomics studies.</p>
        </sec>
        <sec sec-type="materials | methods">
            <title>Materials and methods</title>
            <p>The leaf rolls of greenhouse grown, two-month old plants of sugarcane cultivar SP80-3280 (provided by Centro de Tecnologia Canavieira, Piracicaba, S&#x00e3;o Paulo), were collected and immediately frozen in liquid nitrogen. The plant tissue was ground up to become fine powder, and high molecular weight DNA was extracted from 100 mg of fresh frozen tissue using CTAB (Sigma-Aldrich, USA) and chloroform:isoamyl alcohol (Sigma-Aldrich, USA) as previously described
                <sup>
                    <xref ref-type="bibr" rid="ref-12">12</xref>
                </sup>. 6&#x00b5;g of DNA were sent to Illumina (CA, USA) for DNA sequencing using TruSeq Synthetic long read technology
                <sup>
                    <xref ref-type="bibr" rid="ref-13">13</xref>
                </sup>, through their FastTrack Sequencing Service. Sequencing was performed on an Illumina HiSeq2000 system using paired-end chemistry. Nine long read libraries, each generating approx. 600Mbps, were generated, giving an estimated coverage between 4 and 5 of the monoploid genome. A total of 1,378,917 reads longer than 1.5Kbp, or 5,642,855,018 bases, were generated. The underlying 1,966,604,928 short reads amount to 393,320,985,600bp, which would translate to an estimated coverage of 393x of the haploid genome. The maximum read length was 20,918bp, with 36% of the reads being longer than 4.5Kbp. Possible contaminants were removed by comparison against the NCBI&#x2019;s nucleotide database using BLAST
                <sup>
                    <xref ref-type="bibr" rid="ref-14">14</xref>
                </sup>, keeping only the long reads with best hits against Viridiplantae, resulting in 1,224,061 useful for assembly. Prior to assembly, long reads originating from mitochondria (NC_008360.1) and chloroplast (NC_005878.2) were excluded using mirabait (
                <ext-link ext-link-type="uri" xlink:href="https://sourceforge.net/projects/mira-assembler/">http://mira-assembler.sourceforge.net/</ext-link>). Reads longer than 1.5Kbp were assembled using Celera&#x2019;s WGS Assembler v8.2
                <sup>
                    <xref ref-type="bibr" rid="ref-15">15</xref>
                </sup>, using similar parameters as previously described
                <sup>
                    <xref ref-type="bibr" rid="ref-13">13</xref>
                </sup>, except for some of the error parameters that were left in their default settings, i.e., 
                <monospace>&#x2018;unitiger=bogart, merSize=31, ovlMinLen=100&#x2019;,</monospace> and the parameters 
                <monospace>ovlErrorRate, cnsErrorRate, cgwErrorRate, utgGraphErrorRate, utgGraphErrorLimit, utgMergeErrorRate, utgMergeErrorLimit.</monospace> A non-redundant assembly was created using CD-HIT
                <sup>
                    <xref ref-type="bibr" rid="ref-16">16</xref>
                </sup>, merging 100% identical sequences and sub-sequences. RNASeq data previously generated in our group
                <sup>
                    <xref ref-type="bibr" rid="ref-17">17</xref>
                </sup> for the same cultivar was exploited for gene prediction using BRAKER1
                <sup>
                    <xref ref-type="bibr" rid="ref-18">18</xref>
                </sup> and PASA
                <sup>
                    <xref ref-type="bibr" rid="ref-19">19</xref>
                </sup>, as well as sugarcane transcript data (ESTs), and 
                <italic toggle="yes">Sorghum bicolor</italic> proteins using Exonerate
                <sup>
                    <xref ref-type="bibr" rid="ref-20">20</xref>
                </sup>, all gene evidence was integrated to generate a high quality gene prediction set with Evidence Modeller
                <sup>
                    <xref ref-type="bibr" rid="ref-21">21</xref>
                </sup>, leading to 153,078 predicted protein-coding genes.</p>
        </sec>
        <sec>
            <title>Data availability</title>
            <p>Raw sequencing data are available at NCBI SRA; the long reads with accession number SRX845504, and the underlying short reads with accessions SRX853961 to SRX853969. The SP80-3280 assembly is available with accession number GCA_002018215.1. All data can be found under the BioProject 
                <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/bioproject/PRJNA272769">PRJNA272769</ext-link>. Genome annotation is available from 
                <ext-link ext-link-type="uri" xlink:href="https://figshare.com/projects/Sugarcane_SP80-3280_draft_genome_annotation/22327">https://figshare.com/projects/Sugarcane_SP80-3280_draft_genome_annotation/22327</ext-link>
            </p>
        </sec>
    </body>
    <back>
        <ack>
            <title>Acknowledgements</title>
            <p>The authors are grateful to Larissa Prado da Cruz (CTBE/CNPEM) for assistance with molecular biology procedures.</p>
        </ack>
        <ref-list>
            <ref id="ref-1">
                <label>1</label>
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Long</surname>
                            <given-names>SP</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Karp</surname>
                            <given-names>A</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Buckeridge</surname>
                            <given-names>MS</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>Feedstocks for Biofuels and Bioenergy</article-title>. In
                    <italic toggle="yes">Bioenergy &amp; Sustainability: bridging the gaps</italic>. (eds. Souza GM, Victoria RL, Joly CA &amp; Verdade LM), UNESCO.<year>2015</year>;<fpage>302</fpage>&#x2013;<lpage>347</lpage>.
                    <ext-link ext-link-type="uri" xlink:href="http://bioenfapesp.org/scopebioenergy/images/chapters/bioen-scope_chapter10.pdf">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref-2">
                <label>2</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Grivet</surname>
                            <given-names>L</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Arruda</surname>
                            <given-names>P</given-names>
                        </name>
					</person-group>:
                    <article-title>Sugarcane genomics: depicting the complex genome of an important tropical crop.</article-title>
                    <source>
						
                        <italic toggle="yes">Curr Opin Plant Biol.</italic>
					</source>
                    <year>2002</year>;<volume>5</volume>(<issue>2</issue>):<fpage>122</fpage>&#x2013;<lpage>127</lpage>.
                    <pub-id pub-id-type="pmid">11856607</pub-id>
                    <pub-id pub-id-type="doi">10.1016/S1369-5266(02)00234-0</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-3">
                <label>3</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>D&#x2019;Hont</surname>
                            <given-names>A</given-names>
                        </name>
					</person-group>:
                    <article-title>Unraveling the genome structure of polyploids using FISH and GISH; examples of sugarcane and banana.</article-title>
                    <source>
						
                        <italic toggle="yes">Cytogenet Genome Res.</italic>
					</source>
                    <year>2005</year>;<volume>109</volume>(<issue>1&#x2013;3</issue>):<fpage>27</fpage>&#x2013;<lpage>33</lpage>.
                    <pub-id pub-id-type="pmid">15753555</pub-id>
                    <pub-id pub-id-type="doi">10.1159/000082378</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-4">
                <label>4</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Le Cunff</surname>
                            <given-names>L</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Garsmeur</surname>
                            <given-names>O</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Raboin</surname>
                            <given-names>LM</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>Diploid/polyploid syntenic shuttle mapping and haplotype-specific chromosome walking toward a rust resistance gene (
                        <italic toggle="yes">Bru1</italic>) in highly polyploid sugarcane (2
                        <italic toggle="yes">n</italic> approximately 12
                        <italic toggle="yes">x</italic> approximately 115).</article-title>
                    <source>
						
                        <italic toggle="yes">Genetics.</italic>
					</source>
                    <year>2008</year>;<volume>180</volume>(<issue>1</issue>):<fpage>649</fpage>&#x2013;<lpage>660</lpage>.
                    <pub-id pub-id-type="pmid">18757946</pub-id>
                    <pub-id pub-id-type="doi">10.1534/genetics.108.091355</pub-id>
                    <pub-id pub-id-type="pmcid">2535714</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-5">
                <label>5</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Miller</surname>
                            <given-names>JR</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Dilley</surname>
                            <given-names>KA</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Harkins</surname>
                            <given-names>DM</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>Initial genome sequencing of the sugarcane CP 96-1252 complex hybrid [version 1; referees: 1 approved].</article-title>
                    <source>
						
                        <italic toggle="yes">F1000Res.</italic>
					</source>
                    <year>2017</year>;<volume>6</volume>:<fpage>688</fpage>.
                    <pub-id pub-id-type="doi">10.12688/f1000research.11629.1</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-6">
                <label>6</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Grativol</surname>
                            <given-names>C</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Regulski</surname>
                            <given-names>M</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Bertalan</surname>
                            <given-names>M</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>Sugarcane genome sequencing by methylation filtration provides tools for genomic research in the genus 
                        <italic toggle="yes">Saccharum</italic>.</article-title>
                    <source>
						
                        <italic toggle="yes">Plant J.</italic>
					</source>
                    <year>2014</year>;<volume>79</volume>(<issue>1</issue>):<fpage>162</fpage>&#x2013;<lpage>172</lpage>.
                    <pub-id pub-id-type="pmid">24773339</pub-id>
                    <pub-id pub-id-type="doi">10.1111/tpj.12539</pub-id>
                    <pub-id pub-id-type="pmcid">4458261</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-7">
                <label>7</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Okura</surname>
                            <given-names>VK</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>de Souza</surname>
                            <given-names>RS</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>de Siqueira Tada</surname>
                            <given-names>SF</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>BAC-Pool Sequencing and Assembly of 19 Mb of the Complex Sugarcane Genome.</article-title>
                    <source>
						
                        <italic toggle="yes">Front Plant Sci.</italic>
					</source>
                    <year>2016</year>;<volume>7</volume>:<fpage>342</fpage>.
                    <pub-id pub-id-type="pmid">27047520</pub-id>
                    <pub-id pub-id-type="doi">10.3389/fpls.2016.00342</pub-id>
                    <pub-id pub-id-type="pmcid">4804495</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-8">
                <label>8</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>de Setta</surname>
                            <given-names>N</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Monteiro-Vitorello</surname>
                            <given-names>CB</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Metcalfe</surname>
                            <given-names>CJ</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>Building the sugarcane genome for biotechnology and identifying evolutionary trends.</article-title>
                    <source>
						
                        <italic toggle="yes">BMC Genomics.</italic>
					</source>
                    <year>2014</year>;<volume>15</volume>(<issue>1</issue>):<fpage>540</fpage>.
                    <pub-id pub-id-type="pmid">24984568</pub-id>
                    <pub-id pub-id-type="doi">10.1186/1471-2164-15-540</pub-id>
                    <pub-id pub-id-type="pmcid">4122759</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-9">
                <label>9</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Mattiello</surname>
                            <given-names>L</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Ria&#x00f1;o-Pach&#x00f3;n</surname>
                            <given-names>DM</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Martins</surname>
                            <given-names>MC</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>Physiological and transcriptional analyses of developmental stages along sugarcane leaf.</article-title>
                    <source>
						
                        <italic toggle="yes">BMC Plant Biol.</italic>
					</source>
                    <year>2015</year>;<volume>15</volume>:<fpage>300</fpage>.
                    <pub-id pub-id-type="pmid">26714767</pub-id>
                    <pub-id pub-id-type="doi">10.1186/s12870-015-0694-z</pub-id>
                    <pub-id pub-id-type="pmcid">4696237</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-10">
                <label>10</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Hoang</surname>
                            <given-names>NV</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Furtado</surname>
                            <given-names>A</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Mason</surname>
                            <given-names>PJ</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>A survey of the complex transcriptome from the highly polyploid sugarcane genome using full-length isoform sequencing and 
                        <italic toggle="yes">de novo</italic> assembly from short read sequencing.</article-title>
                    <source>
						
                        <italic toggle="yes">BMC Genomics.</italic>
					</source>
                    <year>2017</year>;<volume>18</volume>(<issue>1</issue>):<fpage>395</fpage>.
                    <pub-id pub-id-type="pmid">28532419</pub-id>
                    <pub-id pub-id-type="doi">10.1186/s12864-017-3757-8</pub-id>
                    <pub-id pub-id-type="pmcid">5440902</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-11">
                <label>11</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Belesini</surname>
                            <given-names>AA</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Carvalho</surname>
                            <given-names>FMS</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Telles</surname>
                            <given-names>BR</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>
                        <italic toggle="yes">De novo</italic> transcriptome assembly of sugarcane leaves submitted to prolonged water-deficit stress.</article-title>
                    <source>
						
                        <italic toggle="yes">Genet Mol Res.</italic>
					</source>
                    <year>2017</year>;<volume>16</volume>(<issue>2</issue>).
                    <pub-id pub-id-type="pmid">28549198</pub-id>
                    <pub-id pub-id-type="doi">10.4238/gmr16028845</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-12">
                <label>12</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Porebski</surname>
                            <given-names>S</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Bailey</surname>
                            <given-names>LG</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Baum</surname>
                            <given-names>BR</given-names>
                        </name>
					</person-group>:
                    <article-title>Modification of a CTAB DNA extraction protocol for plants containing high polysaccharide and polyphenol components.</article-title>
                    <source>
						
                        <italic toggle="yes">Plant Mol Biol Rep.</italic>
					</source>
                    <year>1997</year>;<volume>15</volume>(<issue>1</issue>):<fpage>8</fpage>&#x2013;<lpage>15</lpage>.
                    <pub-id pub-id-type="doi">10.1007/BF02772108</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-13">
                <label>13</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>McCoy</surname>
                            <given-names>RC</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Taylor</surname>
                            <given-names>RW</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Blauwkamp</surname>
                            <given-names>TA</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>Illumina TruSeq synthetic long-reads empower 
                        <italic toggle="yes">de novo</italic> assembly and resolve complex, highly-repetitive transposable elements.</article-title>
                    <source>
						
                        <italic toggle="yes">PLoS One.</italic>
					</source>
                    <year>2014</year>;<volume>9</volume>(<issue>9</issue>):<fpage> e106689</fpage>.
                    <pub-id pub-id-type="pmid">25188499</pub-id>
                    <pub-id pub-id-type="doi">10.1371/journal.pone.0106689</pub-id>
                    <pub-id pub-id-type="pmcid">4154752</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-14">
                <label>14</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Altschul</surname>
                            <given-names>SF</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Gish</surname>
                            <given-names>W</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Miller</surname>
                            <given-names>W</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>Basic local alignment search tool.</article-title>
                    <source>
						
                        <italic toggle="yes">J Mol Biol.</italic>
					</source>
                    <year>1990</year>;<volume>215</volume>(<issue>3</issue>):<fpage> 403</fpage>&#x2013;<lpage>410</lpage>.
                    <pub-id pub-id-type="pmid">2231712</pub-id>
                    <pub-id pub-id-type="doi">10.1016/S0022-2836(05)80360-2</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-15">
                <label>15</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
					
                        <name name-style="western">
                            <surname>Myers</surname>
                            <given-names>EW</given-names>
                        </name>
					
                        <name name-style="western">
                            <surname>Sutton</surname>
                            <given-names>GG</given-names>
                        </name>
					
                        <name name-style="western">
                            <surname>Delcher</surname>
                            <given-names>AL</given-names>
                        </name>
					
                        <etal/>
				</person-group>:
                    <article-title>A Whole-Genome Assembly of 
                        <italic toggle="yes">Drosophila.</italic>
				</article-title>
                    <source>
					
                        <italic toggle="yes">Science.</italic>
				</source>
                    <year>2000</year>;<volume>287</volume>(<issue>5461</issue>):<fpage>2196</fpage>&#x2013;<lpage>2204</lpage>.
                    <pub-id pub-id-type="pmid">10731133</pub-id>
                    <pub-id pub-id-type="doi">10.1126/science.287.5461.2196</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-16">
                <label>16</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Fu</surname>
                            <given-names>L</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Niu</surname>
                            <given-names>B</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Zhu</surname>
                            <given-names>Z</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>CD-HIT: accelerated for clustering the next-generation sequencing data.</article-title>
                    <source>
						
                        <italic toggle="yes">Bioinformatics.</italic>
					</source>
                    <year>2012</year>;<volume>28</volume>(<issue>23</issue>):<fpage> 3150</fpage>&#x2013;<lpage>3152</lpage>.
                    <pub-id pub-id-type="pmid">23060610</pub-id>
                    <pub-id pub-id-type="doi">10.1093/bioinformatics/bts565</pub-id>
                    <pub-id pub-id-type="pmcid">3516142</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-17">
                <label>17</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Ria&#x00f1;o-Pach&#x00f3;n</surname>
                            <given-names>DM</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Mattiello</surname>
                            <given-names>L</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Cruz</surname>
                            <given-names>LP</given-names>
                        </name>
						</person-group>:
                    <article-title>Surveying the complex polyploid sugarcane genome sequence using synthetic long reads</article-title>. Technical Memorandum Centro Nacional de Pesquisa em Energia e Materiais.<year>2016</year>.
                    <pub-id pub-id-type="doi">10.13140/RG.2.1.3468.0565</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-18">
                <label>18</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
					
                        <name name-style="western">
                            <surname>Hoff</surname>
                            <given-names>KJ</given-names>
                        </name>
					
                        <name name-style="western">
                            <surname>Lange</surname>
                            <given-names>S</given-names>
                        </name>
					
                        <name name-style="western">
                            <surname>Lomsadze</surname>
                            <given-names>A</given-names>
                        </name>
					
                        <etal/>
				</person-group>:
                    <article-title>BRAKER1: Unsupervised RNA-Seq-Based Genome Annotation with GeneMark-ET and AUGUSTUS.</article-title>
                    <source>
					
                        <italic toggle="yes">Bioinformatics.</italic>
				</source>
                    <year>2016</year>;<volume>32</volume>(<issue>5</issue>):<fpage>767</fpage>&#x2013;<lpage>9</lpage>.
                    <pub-id pub-id-type="pmid">26559507</pub-id>
                    <pub-id pub-id-type="doi">10.1093/bioinformatics/btv661</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-19">
                <label>19</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
					
                        <name name-style="western">
                            <surname>Haas</surname>
                            <given-names>BJ</given-names>
                        </name>
					
                        <name name-style="western">
                            <surname>Delcher</surname>
                            <given-names>AL</given-names>
                        </name>
					
                        <name name-style="western">
                            <surname>Mount</surname>
                            <given-names>SM</given-names>
                        </name>
					
                        <etal/>
				</person-group>:
                    <article-title>Improving the 
                        <italic toggle="yes">Arabidopsis</italic> genome annotation using maximal transcript alignment assemblies.</article-title>
                    <source>
					
                        <italic toggle="yes">Nucleic Acids Res.</italic>
				</source>
                    <year>2003</year>;<volume>31</volume>(<issue>19</issue>):<fpage>5654</fpage>&#x2013;<lpage>66</lpage>.
                    <pub-id pub-id-type="pmid">14500829</pub-id>
                    <pub-id pub-id-type="doi">10.1093/nar/gkg770</pub-id>
                    <pub-id pub-id-type="pmcid">206470</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-20">
                <label>20</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
					
                        <name name-style="western">
                            <surname>Slater</surname>
                            <given-names>GS</given-names>
                        </name>
					
                        <name name-style="western">
                            <surname>Birney</surname>
                            <given-names>E</given-names>
                        </name>
				</person-group>:
                    <article-title>Automated generation of heuristics for biological sequence comparison.</article-title>
                    <source>
					
                        <italic toggle="yes">BMC Bioinformatics.</italic>
				</source>
                    <year>2005</year>;<volume>6</volume>:<fpage>31</fpage>.
                    <pub-id pub-id-type="pmid">15713233</pub-id>
                    <pub-id pub-id-type="doi">10.1186/1471-2105-6-31</pub-id>
                    <pub-id pub-id-type="pmcid">553969</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-21">
                <label>21</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
					
                        <name name-style="western">
                            <surname>Haas</surname>
                            <given-names>BJ</given-names>
                        </name>
					
                        <name name-style="western">
                            <surname>Salzberg</surname>
                            <given-names>SL</given-names>
                        </name>
					
                        <name name-style="western">
                            <surname>Zhu</surname>
                            <given-names>W</given-names>
                        </name>
					
                        <etal/>
				</person-group>:
                    <article-title>Automated eukaryotic gene structure annotation using EVidenceModeler  and the Program to Assemble Spliced Alignments.</article-title>
                    <source>
					
                        <italic toggle="yes">Genome Biol.</italic>
				</source>
                    <year>2008</year>;<volume>9</volume>(<issue>1</issue>):<fpage>R7</fpage>.
                    <pub-id pub-id-type="pmid">18190707</pub-id>
                    <pub-id pub-id-type="doi">10.1186/gb-2008-9-1-r7</pub-id>
                    <pub-id pub-id-type="pmcid">2395244</pub-id>
                </mixed-citation>
            </ref>
        </ref-list>
    </back>
    <sub-article article-type="reviewer-report" id="report23980">
        <front-stub>
            <article-id pub-id-type="doi">10.5256/f1000research.13012.r23980</article-id>
            <title-group>
                <article-title>Reviewer response for version 2</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author">
                    <name>
                        <surname>Mohan</surname>
                        <given-names>Chakravarthi</given-names>
                    </name>
                    <xref ref-type="aff" rid="r23980a1">1</xref>
                    <role>Referee</role>
                    <uri content-type="orcid">https://orcid.org/0000-0002-4494-7699</uri>
                </contrib>
                <aff id="r23980a1">
                    <label>1</label>Department of Genetics and Evolution, Federal University of S&#x00e3;o Carlos, S&#x00e3;o Carlos, Brazil</aff>
            </contrib-group>
            <author-notes>
                <fn fn-type="conflict">
                    <p>
                        <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>1</day>
                <month>8</month>
                <year>2017</year>
            </pub-date>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2017 Mohan C</copyright-statement>
                <copyright-year>2017</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access peer review report distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <related-article ext-link-type="doi" id="relatedArticleReport23980" related-article-type="peer-reviewed-article" xlink:href="10.12688/f1000research.11859.2"/>
            <custom-meta-group>
                <custom-meta>
                    <meta-name>recommendation</meta-name>
                    <meta-value>approve</meta-value>
                </custom-meta>
            </custom-meta-group>
        </front-stub>
        <body>
            <p>No further comments.</p>
            <p>Are sufficient details of methods and materials provided to allow replication by others?</p>
            <p>Yes</p>
            <p>Is the rationale for creating the dataset(s) clearly described?</p>
            <p>Yes</p>
            <p>Are the datasets clearly presented in a useable and accessible format?</p>
            <p>Yes</p>
            <p>Are the protocols appropriate and is the work technically sound?</p>
            <p>Yes</p>
            <p>Reviewer Expertise:</p>
            <p>Sugarcane genetic engineering, transcriptomics</p>
            <p>I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard.</p>
        </body>
    </sub-article>
    <sub-article article-type="reviewer-report" id="report23667">
        <front-stub>
            <article-id pub-id-type="doi">10.5256/f1000research.12814.r23667</article-id>
            <title-group>
                <article-title>Reviewer response for version 1</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author">
                    <name>
                        <surname>Mohan</surname>
                        <given-names>Chakravarthi</given-names>
                    </name>
                    <xref ref-type="aff" rid="r23667a1">1</xref>
                    <role>Referee</role>
                    <uri content-type="orcid">https://orcid.org/0000-0002-4494-7699</uri>
                </contrib>
                <aff id="r23667a1">
                    <label>1</label>Department of Genetics and Evolution, Federal University of S&#x00e3;o Carlos, S&#x00e3;o Carlos, Brazil</aff>
            </contrib-group>
            <author-notes>
                <fn fn-type="conflict">
                    <p>
                        <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>21</day>
                <month>6</month>
                <year>2017</year>
            </pub-date>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2017 Mohan C</copyright-statement>
                <copyright-year>2017</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access peer review report distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <related-article ext-link-type="doi" id="relatedArticleReport23667" related-article-type="peer-reviewed-article" xlink:href="10.12688/f1000research.11859.1"/>
            <custom-meta-group>
                <custom-meta>
                    <meta-name>recommendation</meta-name>
                    <meta-value>approve</meta-value>
                </custom-meta>
            </custom-meta-group>
        </front-stub>
        <body>
            <p>The data note entitled '
                <ext-link ext-link-type="uri" xlink:href="https://f1000research.com/articles/6-861/v1">Draft genome sequencing of the sugarcane hybrid SP80-3280</ext-link>' is perhaps the first report describing the whole genome of sugarcane, a complex polyploid and its availability in NCBI will be a boon to sugarcane researchers.</p>
            <p> </p>
            <p> The study is well planned, executed and well drafted. The data presented here would be particularly useful for functional genomic studies in sugarcane.</p>
            <p>Are sufficient details of methods and materials provided to allow replication by others?</p>
            <p>Yes</p>
            <p>Is the rationale for creating the dataset(s) clearly described?</p>
            <p>Yes</p>
            <p>Are the datasets clearly presented in a useable and accessible format?</p>
            <p>Yes</p>
            <p>Are the protocols appropriate and is the work technically sound?</p>
            <p>Yes</p>
            <p>Reviewer Expertise:</p>
            <p>Sugarcane genetic engineering, transcriptomics</p>
            <p>I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard.</p>
        </body>
        <sub-article article-type="response" id="comment2833-23667">
            <front-stub>
                <contrib-group>
                    <contrib contrib-type="author">
                        <name>
                            <surname>Ria&#x00f1;o-Pach&#x00f3;n</surname>
                            <given-names>Diego Mauricio</given-names>
                        </name>
                        <aff>University of S&#x00e3;o Paulo, Brazil</aff>
                    </contrib>
                </contrib-group>
                <author-notes>
                    <fn fn-type="conflict">
                        <p>
                            <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                    </fn>
                </author-notes>
                <pub-date pub-type="epub">
                    <day>23</day>
                    <month>6</month>
                    <year>2017</year>
                </pub-date>
            </front-stub>
            <body>
                <p>Dear Dr. Mohan,</p>
                <p> </p>
                <p> thanks you for your review of our data note. In version 2 of the note we have added links for the genome annotation in addition to the genome assembly.</p>
                <p> </p>
                <p> Best regards,</p>
                <p> </p>
                <p> Diego</p>
            </body>
        </sub-article>
    </sub-article>
    <sub-article article-type="reviewer-report" id="report23398">
        <front-stub>
            <article-id pub-id-type="doi">10.5256/f1000research.12814.r23398</article-id>
            <title-group>
                <article-title>Reviewer response for version 1</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author">
                    <name>
                        <surname>Miller</surname>
                        <given-names>Jason</given-names>
                    </name>
                    <xref ref-type="aff" rid="r23398a1">1</xref>
                    <role>Referee</role>
                    <uri content-type="orcid">https://orcid.org/0000-0002-6912-2925</uri>
                </contrib>
                <aff id="r23398a1">
                    <label>1</label>J. Craig Venter Institute, Rockville, MD, USA</aff>
            </contrib-group>
            <author-notes>
                <fn fn-type="conflict">
                    <p>
                        <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>15</day>
                <month>6</month>
                <year>2017</year>
            </pub-date>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2017 Miller J</copyright-statement>
                <copyright-year>2017</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access peer review report distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <related-article ext-link-type="doi" id="relatedArticleReport23398" related-article-type="peer-reviewed-article" xlink:href="10.12688/f1000research.11859.1"/>
            <custom-meta-group>
                <custom-meta>
                    <meta-name>recommendation</meta-name>
                    <meta-value>approve</meta-value>
                </custom-meta>
            </custom-meta-group>
        </front-stub>
        <body>
            <p>Summary:</p>
            <p> </p>
            <p> The Data Note, "Draft genome sequencing of the sugarcane hybrid SP80-3280",&#x00a0;describes a sugarcane genome assembly that is available at NCBI. The TruSeq method was applied to a monoploid sugarcane cultivar to generate a 1.2 gigabase assembly with a 8433 contig N50 according to GenBank. This is the first sugarcane genome assembly so it will be of interest to the field. This data note is especially useful because it describes the sequence filtering by size, blast, mirabit, and cd-hit prior to release.</p>
            <p> Suggestions:</p>
            <p> The sentence, &#x201c;there are not whole genome assemblies available&#x201d;, probably should say &#x201c;there are no whole genome assemblies available&#x201d;. The text could be made clearer by presenting all the statics for underlying short reads before getting to the synthetic long read stats, and by specifying that the blast filter was applied to the long reads. I would appreciate a reference for Celera Assembler, but that is just me.</p>
            <p>Are sufficient details of methods and materials provided to allow replication by others?</p>
            <p>Yes</p>
            <p>Is the rationale for creating the dataset(s) clearly described?</p>
            <p>Yes</p>
            <p>Are the datasets clearly presented in a useable and accessible format?</p>
            <p>Yes</p>
            <p>Are the protocols appropriate and is the work technically sound?</p>
            <p>Yes</p>
            <p>Reviewer Expertise:</p>
            <p>Genome assembly</p>
            <p>I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard.</p>
        </body>
        <sub-article article-type="response" id="comment2832-23398">
            <front-stub>
                <contrib-group>
                    <contrib contrib-type="author">
                        <name>
                            <surname>Ria&#x00f1;o-Pach&#x00f3;n</surname>
                            <given-names>Diego Mauricio</given-names>
                        </name>
                        <aff>University of S&#x00e3;o Paulo, Brazil</aff>
                    </contrib>
                </contrib-group>
                <author-notes>
                    <fn fn-type="conflict">
                        <p>
                            <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                    </fn>
                </author-notes>
                <pub-date pub-type="epub">
                    <day>23</day>
                    <month>6</month>
                    <year>2017</year>
                </pub-date>
            </front-stub>
            <body>
                <p>Dear Dr. Miller,</p>
                <p> </p>
                <p> thank you very much for your review of our data note. We have followed your main suggestions, and they are available as version 2 of the data note.</p>
                <p> </p>
                <p> Best regards,</p>
                <p> </p>
                <p> Diego</p>
            </body>
        </sub-article>
    </sub-article>
</article>
