<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.2 20190208//EN" "http://jats.nlm.nih.gov/publishing/1.2/JATS-journalpublishing1.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="methods-article" dtd-version="1.2" xml:lang="en">
    <front>
        <journal-meta>
            <journal-id journal-id-type="pmc">F1000Research</journal-id>
            <journal-title-group>
                <journal-title>F1000Research</journal-title>
            </journal-title-group>
            <issn pub-type="epub">2046-1402</issn>
            <publisher>
                <publisher-name>F1000 Research Limited</publisher-name>
                <publisher-loc>London, UK</publisher-loc>
            </publisher>
        </journal-meta>
        <article-meta>
            <article-id pub-id-type="doi">10.12688/f1000research.6391.1</article-id>
            <article-categories>
                <subj-group subj-group-type="heading">
                    <subject>Method Article</subject>
                </subj-group>
                <subj-group>
                    <subject>Articles</subject>
                    <subj-group>
                        <subject>Bioinformatics</subject>
                    </subj-group>
                    <subj-group>
                        <subject>Genomics</subject>
                    </subj-group>
                </subj-group>
            </article-categories>
            <title-group>
                <article-title>Signal-processing tools for core-collection selection from genetic-resource collections</article-title>
                <fn-group content-type="pub-status">
                    <fn>
                        <p>[version 1; peer review: peer review discontinued]</p>
                    </fn>
                </fn-group>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author" corresp="yes">
                    <name>
                        <surname>Borrayo</surname>
                        <given-names>Ernesto</given-names>
                    </name>
                    <xref ref-type="corresp" rid="c1">a</xref>
                    <xref ref-type="aff" rid="a1">1</xref>
                </contrib>
                <contrib contrib-type="author" corresp="yes">
                    <name>
                        <surname>Takeya</surname>
                        <given-names>Masaru</given-names>
                    </name>
                    <xref ref-type="corresp" rid="c2">b</xref>
                    <xref ref-type="aff" rid="a2">2</xref>
                </contrib>
                <aff id="a1">
                    <label>1</label>Gene Research Center, University of Tsukuba, Tsukuba City, Ibaraki, 305-8572, Japan</aff>
                <aff id="a2">
                    <label>2</label>Genetic Resources Center, National Institute of Agrobiological Sciences, Tsukuba City, Ibaraki, 305-8602, Japan</aff>
            </contrib-group>
            <author-notes>
                <corresp id="c1">
                    <label>a</label>
                    <email xlink:href="mailto:carbajal.borrayo.gb@u.tsukuba.ac.jp">carbajal.borrayo.gb@u.tsukuba.ac.jp</email>
                </corresp>
                <corresp id="c2">
                    <label>b</label>
                    <email xlink:href="mailto:katu@affrc.go.jp">katu@affrc.go.jp</email>
                </corresp>
                <fn fn-type="con">
                    <p>EB conceived and designed the algorithm, performed the implementation, analysed the data and wrote the manuscript. MT contributed to the design of the algorithm, data analysis and manuscript drafting and correction. Both authors have read and approved the final manuscript.</p>
                </fn>
                <fn fn-type="conflict">
                    <p>
                        <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>23</day>
                <month>4</month>
                <year>2015</year>
            </pub-date>
            <pub-date pub-type="collection">
                <year>2015</year>
            </pub-date>
            <volume>4</volume>
            <elocation-id>97</elocation-id>
            <history>
                <date date-type="accepted">
                    <day>22</day>
                    <month>4</month>
                    <year>2015</year>
                </date>
            </history>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2015 Borrayo E and Takeya M</copyright-statement>
                <copyright-year>2015</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access article distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <self-uri content-type="pdf" xlink:href="https://f1000research.com/articles/4-97/pdf"/>
            <abstract>
                <p>Selecting a representative core collection (CC) is a proven and effective strategy for overcoming the expenses and difficulties of managing genetic resources in gene banks around the globe. Because of the diverse applications available for these sub-collections, several algorithms have been successfully implemented to construct them based on genotypic, phenotypic, passport or geographic data (either by individual datasets or by consensus). However, to the best of our knowledge, no single comprehensive dataset has been properly explored to date. Thus, researchers evaluate multiple datasets in order to construct representative CCs; this can be quite difficult, but one feasible solution for such an evaluation is to manage all available data as one discrete signal, which allows signal processing tools (SPTs) to be implemented during data analysis. In this research, we present a proof-of-concept study that shows the possibility of mapping to a discrete signal any type of data available from genetic resource collections in order to take advantage of SPTs for the construction of CCs that adequately represent the diversity of two crops. This method is referred to as &#x2018;SPT selection&#x2019;. All available information for each element of the tested collections was analysed under this perspective and compared, when possible, with one of the most used algorithms for CC selection. Genotype-only SPT selection did not prove as effective as standard CC selection algorithms; however, the SPT approach can consider genotype alongside other types of information, which results in well-represented CCs that consider both the genotypic and agromorphological diversities present in original collections. Furthermore, SPT-based analysis can evaluate all available data both in a comprehensive manner and under different perspectives, and despite its limitations, the analysis renders satisfactory results. 
Thus, SPT-based algorithms for CC selection can be valuable in the field of genetic resources research, management and exploitation.</p>
            </abstract>
            <kwd-group kwd-group-type="author">
                <kwd>Core collection</kwd>
                <kwd>Fast Fourier Transform</kwd>
                <kwd>Genetic resource management</kwd>
                <kwd>Rice</kwd>
                <kwd>Foxtail millet</kwd>
            </kwd-group>
            <funding-group>
                <award-group id="fund-1" xlink:href="http://dx.doi.org/10.13039/501100004532">
                    <funding-source>Japan International Cooperation Agency</funding-source>
                </award-group>
                <award-group id="fund-2" xlink:href="http://dx.doi.org/10.13039/501100002241">
                    <funding-source>Japan Science and Technology Agency</funding-source>
                </award-group>
                <award-group id="fund-3" xlink:href="http://dx.doi.org/10.13039/501100001691">
                    <funding-source>Japan Society for the Promotion of Science</funding-source>
                    <award-id>25257416</award-id>
                </award-group>
                <funding-statement>This research is supported in part by the SATREPS project by JST and JICA, Diversity Assessment and Development of Sustainable Use of Mexican Genetic Resources and in part by JSPS Grant-in-Aid 25257416.</funding-statement>
                <funding-statement>
                    <italic>The funders had no role in study design, data collection and analysis, decision to publish, or preparation of the manuscript.</italic>
                </funding-statement>
            </funding-group>
        </article-meta>
    </front>
    <body>
        <sec>
            <title>Background</title>
            <p>One of the most promising techniques for conserving the diversity of genetic resources is 
                <italic toggle="yes">ex situ</italic> genebank germplasm collection. A significant effort has been made on a global scale to preserve, characterize, distribute and utilise genetic resources in order to understand their biological phenomena and to confront the vulnerable situation regarding the sustainability of future human development
                <sup>
                    <xref ref-type="bibr" rid="ref-1">1</xref>,
                    <xref ref-type="bibr" rid="ref-2">2</xref>
                </sup>. As the size of germplasm collections increases, it becomes difficult to appropriately manage and extensively evaluate them
                <sup>
                    <xref ref-type="bibr" rid="ref-3">3</xref>
                </sup>; thus, the core collection (CC) concept
                <sup>
                    <xref ref-type="bibr" rid="ref-4">4</xref>
                </sup> has become a fundamental genetic resource management approach and exploits the potential of a complete collection in terms of viable data management and monetary expenses
                <sup>
                    <xref ref-type="bibr" rid="ref-5">5</xref>&#x2013;
                    <xref ref-type="bibr" rid="ref-8">8</xref>
                </sup>.</p>
            <p>Different CCs have different purposes, characteristics and evaluation criteria
                <sup>
                    <xref ref-type="bibr" rid="ref-7">7</xref>,
                    <xref ref-type="bibr" rid="ref-9">9</xref>&#x2013;
                    <xref ref-type="bibr" rid="ref-11">11</xref>
                </sup>; thus, several different algorithms and informatics tools have been developed and implemented
                <sup>
                    <xref ref-type="bibr" rid="ref-12">12</xref>&#x2013;
                    <xref ref-type="bibr" rid="ref-15">15</xref>
                </sup> with different approaches for satisfying particular needs of each CC. Because these CCs are constructed mainly on the basis of genotypic, phenotypic, passport or geographic data (either by individual datasets or by consensus)
                <sup>
                    <xref ref-type="bibr" rid="ref-16">16</xref>
                </sup>, there is a lack of all-inclusive datasets; this limits the possibility of generating a CC that may satisfy most basic and applied genetic resource research programs. To the best of our knowledge, no single comprehensive dataset has been properly explored to date. One possible method to create a comprehensive dataset is to represent the available data as numerical values. Several methods exist that convert genomic information into numerical values
                <sup>
                    <xref ref-type="bibr" rid="ref-17">17</xref>
                </sup> and agromorphological traits (ATs) into scores
                <sup>
                    <xref ref-type="bibr" rid="ref-18">18</xref>
                </sup>. Through this mapping process, treating each data vector as a discrete signal that can, in turn, be analysed by signal processing tools (SPTs) is possible, thus providing an effective tool for a comprehensive evaluation of datasets. We present a proof-of-concept study that shows the possibility of mapping to a discrete signal any type of data available from genetic resource collections in order to take advantage of SPTs for CC selections; this possibility provides new decision-making criteria for genetic resource management and research.</p>
        </sec>
        <sec sec-type="methods">
            <title>Methods</title>
            <sec>
                <title>Mapping data</title>
                <p>Each input datum must be mapped to a numerical value. This is a fundamental process of the algorithm because it enables different datasets to be analysed together, regardless of their nature. In this manner, dissimilar passport data, single nucleotide polymorphisms (SNPs), restriction fragment length polymorphisms (RFLPs), geographic information and phenotypical traits can be included in one comprehensive dataset. To consistently represent each data type, reference tables are implemented according to the nature of the data: genetic information (originally represented as character elements) is now represented by a numerical vector, and trait variation, simple sequence repeat (SSR) molecular markers and passport data can be represented as either binary or normalized data depending on the quantitative/qualitative nature of the data. The original data and reference tables for this study are available in 
                    <xref ref-type="other" rid="SM1">supplementary material 1</xref>. Data transformation for this study rendered a matrix containing the representation of MC samples (
                    <italic toggle="yes">i</italic>
                    <sub>1</sub>, 
                    <italic toggle="yes">i</italic>
                    <sub>2</sub>, 
                    <italic toggle="yes">i</italic>
                    <sub>3</sub>, &#x2026;
                    <italic toggle="yes">i</italic>
                    <sub>
                        <italic toggle="yes">n</italic>
                    </sub>) with (
                    <italic toggle="yes">j</italic>
                    <sub>1</sub>, 
                    <italic toggle="yes">j</italic>
                    <sub>2</sub>, 
                    <italic toggle="yes">j</italic>
                    <sub>3</sub>, &#x2026; 
                    <italic toggle="yes">j</italic>
                    <sub>
                        <italic toggle="yes">m</italic>
                    </sub>) elements each, where 
                    <italic toggle="yes">n</italic> is the total number of samples, and 
                    <italic toggle="yes">m</italic> is the number of included sample 
                    <italic toggle="yes">characteristics</italic>, represented by a numerical value as 
                    <italic toggle="yes">data</italic>
                    <sub>(
                        <italic toggle="yes">i, j</italic>)</sub>.</p>
            </sec>
            <sec>
                <title>Signal construction</title>
                <p>Numerical representations of each 
                    <italic toggle="yes">j</italic>th 
                    <italic toggle="yes">data</italic> element can be treated as frequency values in 
                    <italic toggle="yes">m data</italic> time in such a manner that each 
                    <italic toggle="yes">i</italic>th sample is treated as a discrete signal. The 
                    <italic toggle="yes">i</italic>th signal corresponds to the information behaviour of each sample. This perspective will enable the implementation of SPTs such as the discrete Fourier transform and power spectrum comparison. Although SPTs can be implemented on all data available for each sample, not all data elements are equally informative for discriminating between samples. To overcome the difference in informativeness of each 
                    <italic toggle="yes">j</italic> element of 
                    <italic toggle="yes">data</italic>, a principal component analysis (PCA) can be performed to rearrange 
                    <italic toggle="yes">data</italic> into a new matrix that has the highly informative elements of 
                    <italic toggle="yes">data</italic> at the beginning and that arranges subsequent elements according to their informativeness, discarding those whose variance equals 0. This process renders two new matrices: the original 
                    <italic toggle="yes">characteristics</italic> mapped vectors matrix (
                    <italic toggle="yes">x</italic>) and rearranged variance value matrix (
                    <italic toggle="yes">X</italic>). Matrix 
                    <italic toggle="yes">X</italic>, therefore, contains 
                    <italic toggle="yes">n</italic> samples that are formed by a numerical vector with 
                    <italic toggle="yes">m</italic>=
                    <italic toggle="yes">m</italic>-(non informative 
                    <italic toggle="yes">characteristics</italic>).</p>
            </sec>
            <sec>
                <title>Fast Fourier transform</title>
                <p>The main objective of the Fourier transform is the decomposition of any signal into a complex histogram of frequencies. The signal function is then represented as a vectorial function whose angle and magnitude determine a sampled point in the signal
                    <sup>
                        <xref ref-type="bibr" rid="ref-19">19</xref>
                    </sup>. The original Fourier model is expressed as follows:</p>
                <p>
                    <disp-formula id="e1">
                        <mml:math display="block" id="math1">
                            <mml:mrow>
                                <mml:mover accent="true">
                                    <mml:mi>f</mml:mi>
                                    <mml:mo>^</mml:mo>
                                </mml:mover>
                                <mml:mo stretchy="false">(</mml:mo>
                                <mml:mi>&#x03be;</mml:mi>
                                <mml:mo stretchy="false">)</mml:mo>
                                <mml:mo>=</mml:mo>
                                <mml:mstyle displaystyle="true">
                                    <mml:mrow>
                                        <mml:munderover>
                                            <mml:mo>&#x222b;</mml:mo>
                                            <mml:mrow>
                                                <mml:mo>&#x2212;</mml:mo>
                                                <mml:mi>&#x221e;</mml:mi>
                                            </mml:mrow>
                                            <mml:mi>&#x221e;</mml:mi>
                                        </mml:munderover>
                                        <mml:mrow>
                                            <mml:mi>f</mml:mi>
                                            <mml:mo stretchy="false">(</mml:mo>
                                            <mml:mi>x</mml:mi>
                                            <mml:mo stretchy="false">)</mml:mo>
                                            <mml:msup>
                                                <mml:mi>e</mml:mi>
                                                <mml:mrow>
                                                    <mml:mo>&#x2212;</mml:mo>
                                                    <mml:mn>2</mml:mn>
                                                    <mml:mi>&#x03c0;</mml:mi>
                                                    <mml:mi>i</mml:mi>
                                                    <mml:mi>x</mml:mi>
                                                    <mml:mi>&#x03be;</mml:mi>
                                                </mml:mrow>
                                            </mml:msup>
                                            <mml:mi>d</mml:mi>
                                            <mml:mi>x</mml:mi>
                                        </mml:mrow>
                                    </mml:mrow>
                                </mml:mstyle>
                                <mml:mo>&#x2009;</mml:mo>
                                <mml:mo>&#x2009;</mml:mo>
                                <mml:mo>&#x2009;</mml:mo>
                                <mml:mo>&#x2009;</mml:mo>
                                <mml:mo>&#x2009;</mml:mo>
                                <mml:mo stretchy="false">(</mml:mo>
                                <mml:mn>1</mml:mn>
                                <mml:mo stretchy="false">)</mml:mo>
                            </mml:mrow>
                        </mml:math>
                    </disp-formula>
                </p>
                <p>where 
                    <italic toggle="yes">x</italic> is the temporal variable, 
                    <italic toggle="yes">&#x03be;</italic> is the frequency variable, 
                    <italic toggle="yes">i</italic> is the square root of &#x2212;1 and 
                    <italic toggle="yes">e</italic> is the base of the natural logarithm. From 
                    <xref ref-type="other" rid="e1">equation 1</xref>, a derivative can be determined for any point 
                    <italic toggle="yes">&#x03be;</italic> sampled in the signal.</p>
                <p>
                    <disp-formula id="e2">
                        <mml:math display="block" id="math2">
                            <mml:mrow>
                                <mml:mi>f</mml:mi>
                                <mml:mo stretchy="false">(</mml:mo>
                                <mml:mi>x</mml:mi>
                                <mml:mo stretchy="false">)</mml:mo>
                                <mml:mo stretchy="false">[</mml:mo>
                                <mml:mi>cos</mml:mi>
                                <mml:mo stretchy="false">(</mml:mo>
                                <mml:mn>2</mml:mn>
                                <mml:mi>&#x03c0;</mml:mi>
                                <mml:mi>x</mml:mi>
                                <mml:mi>&#x03be;</mml:mi>
                                <mml:mo stretchy="false">)</mml:mo>
                                <mml:mo>&#x2212;</mml:mo>
                                <mml:mi>i</mml:mi>
                                <mml:mo>*</mml:mo>
                                <mml:mtext>&#x200b;</mml:mtext>
                                <mml:mi>sin</mml:mi>
                                <mml:mo stretchy="false">(</mml:mo>
                                <mml:mn>2</mml:mn>
                                <mml:mi>&#x03c0;</mml:mi>
                                <mml:mi>x</mml:mi>
                                <mml:mi>&#x03be;</mml:mi>
                                <mml:mo stretchy="false">)</mml:mo>
                                <mml:mo stretchy="false">]</mml:mo>
                                <mml:mo>&#x2009;</mml:mo>
                                <mml:mo>&#x2009;</mml:mo>
                                <mml:mo>&#x2009;</mml:mo>
                                <mml:mo>&#x2009;</mml:mo>
                                <mml:mo>&#x2009;</mml:mo>
                                <mml:mo stretchy="false">(</mml:mo>
                                <mml:mn>2</mml:mn>
                                <mml:mo stretchy="false">)</mml:mo>
                            </mml:mrow>
                        </mml:math>
                    </disp-formula>
                </p>
                <p>The Fourier transform can be applied to any complex numerical series, but in a practical sense, the computational cost of its direct evaluation grows quadratically with the length of the series. Thus, the fast Fourier transform (FFT) is more often implemented and can be defined according to the Cooley-Tukey algorithm
                    <sup>
                        <xref ref-type="bibr" rid="ref-20">20</xref>
                    </sup> as follows:</p>
                <p>
                    <disp-formula id="e3">
                        <mml:math display="block" id="math3">
                            <mml:mrow>
                                <mml:msub>
                                    <mml:mi>X</mml:mi>
                                    <mml:mi>k</mml:mi>
                                </mml:msub>
                                <mml:mo>=</mml:mo>
                                <mml:mstyle displaystyle="true">
                                    <mml:munderover>
                                        <mml:mo>&#x2211;</mml:mo>
                                        <mml:mrow>
                                            <mml:mi>n</mml:mi>
                                            <mml:mo>=</mml:mo>
                                            <mml:mn>0</mml:mn>
                                        </mml:mrow>
                                        <mml:mrow>
                                            <mml:mi>N</mml:mi>
                                            <mml:mo>&#x2212;</mml:mo>
                                            <mml:mn>1</mml:mn>
                                        </mml:mrow>
                                    </mml:munderover>
                                    <mml:mrow>
                                        <mml:msub>
                                            <mml:mi>x</mml:mi>
                                            <mml:mi>n</mml:mi>
                                        </mml:msub>
                                        <mml:msup>
                                            <mml:mi>e</mml:mi>
                                            <mml:mrow>
                                                <mml:mo>&#x2212;</mml:mo>
                                                <mml:mi>i</mml:mi>
                                                <mml:mn>2</mml:mn>
                                                <mml:mi>&#x03c0;</mml:mi>
                                                <mml:mi>k</mml:mi>
                                                <mml:mfrac>
                                                    <mml:mi>n</mml:mi>
                                                    <mml:mi>N</mml:mi>
                                                </mml:mfrac>
                                            </mml:mrow>
                                        </mml:msup>
                                    </mml:mrow>
                                </mml:mstyle>
                                <mml:mo>&#x2009;</mml:mo>
                                <mml:mo>&#x2009;</mml:mo>
                                <mml:mo>&#x2009;</mml:mo>
                                <mml:mo>&#x2009;</mml:mo>
                                <mml:mo stretchy="false">(</mml:mo>
                                <mml:mn>3</mml:mn>
                                <mml:mo stretchy="false">)</mml:mo>
                            </mml:mrow>
                        </mml:math>
                    </disp-formula>
                </p>
                <p>where 
                    <italic toggle="yes">N</italic> is the vector length, 
                    <italic toggle="yes">x</italic> is the temporal variable, 
                    <italic toggle="yes">i</italic> is the square root of &#x2212;1 and 
                    <italic toggle="yes">e</italic> is the base of the natural logarithm, in such a manner that a Euclidean representation &#x2013; with the angle, magnitude and phase that correspond to its position in the signal &#x2013; exists for any signal point.</p>
                <p>Therefore, mapping any signal into a vectorial representation that contains information from every original signal point is possible. From this complex vector, useful data can be retrieved to establish a comparison between them that indirectly represents the original signal&#x2019;s juxtaposition
                    <sup>
                        <xref ref-type="bibr" rid="ref-21">21</xref>
                    </sup>.</p>
            </sec>
            <sec>
                <title>Distance matrix computation</title>
                <p>Inspired by the genomic signal processing alignment-free distance (GAFD) model
                    <sup>
                        <xref ref-type="bibr" rid="ref-22">22</xref>
                    </sup>, each signal corresponding to the PCA-mapped accessions data in a set &#x015c;
                    <sub>
                        <italic toggle="yes">i</italic>
                    </sub> was converted into its frequency representation by applying discrete Fourier transform. Its power spectrum 
                    <mml:math id="math11">
                        <mml:mrow>
                            <mml:msub>
                                <mml:mover accent="true">
                                    <mml:mi>F</mml:mi>
                                    <mml:mo>^</mml:mo>
                                </mml:mover>
                                <mml:mi>i</mml:mi>
                            </mml:msub>
                        </mml:mrow>
                    </mml:math> was then computed. Subsequently, the distance 
                    <italic toggle="yes">D</italic>(
                    <italic toggle="yes">i</italic>, 
                    <italic toggle="yes">j</italic>) for a given pair of comprehensive data signals was calculated by obtaining the mean squared error (MSE) of their respective power spectra:</p>
                <p>
                    <disp-formula id="e4">
                        <mml:math display="block" id="math4">
                            <mml:mrow>
                                <mml:mi>D</mml:mi>
                                <mml:mo stretchy="false">(</mml:mo>
                                <mml:mi>i</mml:mi>
                                <mml:mo>,</mml:mo>
                                <mml:mi>j</mml:mi>
                                <mml:mo stretchy="false">)</mml:mo>
                                <mml:mo>=</mml:mo>
                                <mml:mstyle displaystyle="true">
                                    <mml:munder>
                                        <mml:mo>&#x2211;</mml:mo>
                                        <mml:mi>x</mml:mi>
                                    </mml:munder>
                                    <mml:msup>
                                        <mml:mrow>
                                            <mml:mo>(</mml:mo>
                                            <mml:mrow>
                                                <mml:msub>
                                                    <mml:mover accent="true">
                                                        <mml:mi>F</mml:mi>
                                                        <mml:mo>^</mml:mo>
                                                    </mml:mover>
                                                    <mml:mi>i</mml:mi>
                                                </mml:msub>
                                                <mml:mo stretchy="false">(</mml:mo>
                                                <mml:mi>x</mml:mi>
                                                <mml:mo stretchy="false">)</mml:mo>
                                                <mml:mo>&#x2212;</mml:mo>
                                                <mml:msub>
                                                    <mml:mover accent="true">
                                                        <mml:mi>F</mml:mi>
                                                        <mml:mo>^</mml:mo>
                                                    </mml:mover>
                                                    <mml:mi>j</mml:mi>
                                                </mml:msub>
                                                <mml:mo stretchy="false">(</mml:mo>
                                                <mml:mi>x</mml:mi>
                                                <mml:mo stretchy="false">)</mml:mo>
                                            </mml:mrow>
                                            <mml:mo>)</mml:mo>
                                        </mml:mrow>
                                        <mml:mn>2</mml:mn>
                                    </mml:msup>
                                </mml:mstyle>
                                <mml:mo>&#x2009;</mml:mo>
                                <mml:mo>&#x2009;</mml:mo>
                                <mml:mo>&#x2009;</mml:mo>
                                <mml:mo>&#x2009;</mml:mo>
                                <mml:mo>&#x2009;</mml:mo>
                                <mml:mo stretchy="false">(</mml:mo>
                                <mml:mn>4</mml:mn>
                                <mml:mo stretchy="false">)</mml:mo>
                            </mml:mrow>
                        </mml:math>
                    </disp-formula>
                </p>
                <p>Finally, a distance matrix (DM) was created by performing a pairwise comparison of all sequences in the set.</p>
                <p>In parallel, we constructed a point-to-point (RAW) DM on the basis of the MSE computed for each pair of signals prior to the PCA.</p>
            </sec>
            <sec>
                <title>Core collection selection</title>
                <p>Selecting a CC by this method requires the generation of a DM for each sample of the MC; this provides the interrelations among samples and enables adequate selection. A schematic of the complete workflow is presented in 
                    <xref ref-type="fig" rid="f1">Figure 1</xref>.</p>
                <fig fig-type="figure" id="f1" orientation="portrait" position="float">
                    <label>Figure 1. </label>
                    <caption>
                        <title>General workflow of the FFT-based core collection selection algorithm.</title>
                        <p>PCA: Principal Component Analysis; FFT: Fast Fourier Transform; CC: Core Collection.</p>
                    </caption>
                    <graphic orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/6857/ae10c947-df55-41ba-8b6b-8759d1e5d579_figure1.gif"/>
                </fig>
                <p>In the past, several methodological procedures have been implemented to select 
                    <italic toggle="yes">K</italic> elements from an MC on the basis of information provided by its DM; among such procedures, the most frequently used one is the hierarchical clustering method
                    <sup>
                        <xref ref-type="bibr" rid="ref-11">11</xref>
                    </sup>. However, the current algorithm does not rely on hierarchical clustering for CC selection; instead, similar to the least distance stepwise sampling method
                    <sup>
                        <xref ref-type="bibr" rid="ref-23">23</xref>
                    </sup>, CC elements are selected by an iterative process, where 
                    <italic toggle="yes">r</italic> samples are selected by different criteria (which may be individually implemented) on each iteration.</p>
                <p>Selection criteria (based on the DM without hierarchical clustering) for the current algorithm are as follows:</p>
                <list list-type="bullet">
                    <list-item>
                        <label>&#x2022;</label>
                        <p>a) The 
                            <italic toggle="yes">i</italic>th sample with the largest number of low distance values among the 
                            <italic toggle="yes">j</italic>th elements.</p>
                    </list-item>
                    <list-item>
                        <label>&#x2022;</label>
                        <p>b) The 
                            <italic toggle="yes">i</italic>th sample with the largest number of high distance values among the 
                            <italic toggle="yes">j</italic>th elements.</p>
                    </list-item>
                    <list-item>
                        <label>&#x2022;</label>
                        <p>c) The 
                            <italic toggle="yes">i</italic>th sample with a lower distance average.</p>
                    </list-item>
                    <list-item>
                        <label>&#x2022;</label>
                        <p>d) The 
                            <italic toggle="yes">i</italic>th sample with a higher distance average.</p>
                    </list-item>
                    <list-item>
                        <label>&#x2022;</label>
                        <p>e) The 
                            <italic toggle="yes">i</italic>th sample with a lower overall distance.</p>
                    </list-item>
                    <list-item>
                        <label>&#x2022;</label>
                        <p>f) The 
                            <italic toggle="yes">i</italic>th sample with a higher overall distance.</p>
                    </list-item>
                </list>
                <p>In cases where multiple samples share the same selection value, the order of appearance is used as the tie-breaking criterion.</p>
                <p>An example of the selection process is presented in 
                    <xref ref-type="fig" rid="f2">Figure 2</xref> and its final result is presented in 
                    <xref ref-type="fig" rid="f3">Figure 3</xref>.</p>
                <fig fig-type="figure" id="f2" orientation="portrait" position="float">
                    <label>Figure 2. </label>
                    <caption>
                        <p>Distribution of the first three principal components of 
                            <italic toggle="yes">Rdata</italic> (
                            <italic toggle="yes">a</italic>), methodology&#x2019;s first (
                            <italic toggle="yes">b</italic>), second (
                            <italic toggle="yes">c</italic>) and third (
                            <italic toggle="yes">d</italic>) iterations; final 
                            <italic toggle="yes">K</italic>=72 distribution is presented in (
                            <italic toggle="yes">e</italic>).</p>
                    </caption>
                    <graphic orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/6857/ae10c947-df55-41ba-8b6b-8759d1e5d579_figure2.gif"/>
                </fig>
                <fig fig-type="figure" id="f3" orientation="portrait" position="float">
                    <label>Figure 3. </label>
                    <caption>
                        <title>Distribution of the first three principal components of the 
                            <italic toggle="yes">K</italic>=72 CC selection (X) from 
                            <italic toggle="yes">Rdata</italic> MC.</title>
                    </caption>
                    <graphic orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/6857/ae10c947-df55-41ba-8b6b-8759d1e5d579_figure3.gif"/>
                </fig>
                <p>Once the selected samples (
                    <italic toggle="yes">r</italic>) are included in the future CC, they (along with others that are identical to them (
                    <italic toggle="yes">s</italic>)) are removed from 
                    <italic toggle="yes">X</italic> for the next iteration; then, a 
                    <italic toggle="yes">DM</italic>
                    <sub>2</sub> with 
                    <italic toggle="yes">n</italic>
                    <sub>2</sub> = 
                    <italic toggle="yes">n</italic>&#x2013;
                    <italic toggle="yes">r</italic>&#x2013;
                    <italic toggle="yes">s</italic> is calculated. This process will continue 
                    <italic toggle="yes">Z</italic> times until 
                    <italic toggle="yes">R</italic> &#x2265; 
                    <italic toggle="yes">K</italic>, where 
                    <italic toggle="yes">R</italic> = (
                    <italic toggle="yes">r</italic>
                    <sub>1</sub> + 
                    <italic toggle="yes">r</italic>
                    <sub>2</sub> + &#x2026; + 
                    <italic toggle="yes">r</italic>
                    <sub>
                        <italic toggle="yes">Z</italic>
                    </sub> ) and 
                    <italic toggle="yes">K</italic> = 
                    <italic toggle="yes">predefined CC elements desired</italic>.</p>
            </sec>
            <sec>
                <title>Evaluation of the selected core collection</title>
                <p>As discussed previously, the best way to evaluate a CC depends on the purpose of that CC, and even if it can be evaluated from the same dataset from which it was constructed, evaluating it with a different dataset
                    <sup>
                        <xref ref-type="bibr" rid="ref-7">7</xref>
                    </sup> is desirable. In this study, we use other datasets for our evaluation whenever possible. The list given below provides the evaluation parameters implemented in this study.</p>
                <list list-type="bullet">
                    <list-item>
                        <label>a)</label>
                        <p>The average distance between each MC sample and the nearest CC sample (ANE) can be calculated using the following equation:</p>
                        <p>
                            <disp-formula id="e5">
                                <mml:math display="block" id="math5">
                                    <mml:mrow>
                                        <mml:mi>A</mml:mi>
                                        <mml:mi>N</mml:mi>
                                        <mml:msub>
                                            <mml:mi>E</mml:mi>
                                            <mml:mrow>
                                                <mml:mi>t</mml:mi>
                                                <mml:mi>o</mml:mi>
                                                <mml:mi>t</mml:mi>
                                            </mml:mrow>
                                        </mml:msub>
                                        <mml:mo>=</mml:mo>
                                        <mml:mfrac>
                                            <mml:mn>1</mml:mn>
                                            <mml:mi>L</mml:mi>
                                        </mml:mfrac>
                                        <mml:mstyle displaystyle="true">
                                            <mml:munderover>
                                                <mml:mo>&#x2211;</mml:mo>
                                                <mml:mrow>
                                                    <mml:mi>k</mml:mi>
                                                    <mml:mo>=</mml:mo>
                                                    <mml:mn>1</mml:mn>
                                                </mml:mrow>
                                                <mml:mi>K</mml:mi>
                                            </mml:munderover>
                                            <mml:mrow>
                                                <mml:mstyle displaystyle="true">
                                                    <mml:munderover>
                                                        <mml:mo>&#x2211;</mml:mo>
                                                        <mml:mrow>
                                                            <mml:mi>j</mml:mi>
                                                            <mml:mo>=</mml:mo>
                                                            <mml:mn>1</mml:mn>
                                                        </mml:mrow>
                                                        <mml:mi>J</mml:mi>
                                                    </mml:munderover>
                                                    <mml:mrow>
                                                        <mml:mi>D</mml:mi>
                                                        <mml:mo stretchy="false">(</mml:mo>
                                                        <mml:mi>k</mml:mi>
                                                        <mml:mo>&#x2212;</mml:mo>
                                                        <mml:mi>c</mml:mi>
                                                        <mml:mi>M</mml:mi>
                                                        <mml:msub>
                                                            <mml:mi>C</mml:mi>
                                                            <mml:mi>j</mml:mi>
                                                        </mml:msub>
                                                        <mml:mo stretchy="false">)</mml:mo>
                                                    </mml:mrow>
                                                </mml:mstyle>
                                            </mml:mrow>
                                        </mml:mstyle>
                                        <mml:mo>&#x2009;</mml:mo>
                                        <mml:mo>&#x2009;</mml:mo>
                                        <mml:mo>&#x2009;</mml:mo>
                                        <mml:mo>&#x2009;</mml:mo>
                                        <mml:mo>&#x2009;</mml:mo>
                                        <mml:mo stretchy="false">(</mml:mo>
                                        <mml:mn>5</mml:mn>
                                        <mml:mo stretchy="false">)</mml:mo>
                                    </mml:mrow>
                                </mml:math>
                            </disp-formula>
                        </p>
                        <p>where 
                            <italic toggle="yes">K</italic> is all CC elements, 
                            <italic toggle="yes">k</italic> is each CC element and 
                            <italic toggle="yes">D</italic> is the distance between 
                            <italic toggle="yes">k</italic> and each 
                            <italic toggle="yes">j</italic>th 
                            <italic toggle="yes">cMC</italic> element whose closest CC element is 
                            <italic toggle="yes">k</italic>, including itself, thus rendering 
                            <italic toggle="yes">L</italic> total comparisons. The ideal ANE value is 0, where each sample of the CC represents itself and those similar to it. This parameter evaluates the homogeneity of the represented MC diversity.</p>
                    </list-item>
                    <list-item>
                        <label>b)</label>
                        <p>The average distance between each CC sample and the nearest CC sample (ENE) can be calculated using the following equation:</p>
                        <p>
                            <disp-formula id="e6">
                                <mml:math display="block" id="math6">
                                    <mml:mrow>
                                        <mml:mi>E</mml:mi>
                                        <mml:mi>N</mml:mi>
                                        <mml:msub>
                                            <mml:mi>E</mml:mi>
                                            <mml:mrow>
                                                <mml:mi>t</mml:mi>
                                                <mml:mi>o</mml:mi>
                                                <mml:mi>t</mml:mi>
                                            </mml:mrow>
                                        </mml:msub>
                                        <mml:mo>=</mml:mo>
                                        <mml:mfrac>
                                            <mml:mn>1</mml:mn>
                                            <mml:mi>L</mml:mi>
                                        </mml:mfrac>
                                        <mml:mstyle displaystyle="true">
                                            <mml:munderover>
                                                <mml:mo>&#x2211;</mml:mo>
                                                <mml:mrow>
                                                    <mml:mi>k</mml:mi>
                                                    <mml:mo>=</mml:mo>
                                                    <mml:mn>1</mml:mn>
                                                </mml:mrow>
                                                <mml:mi>K</mml:mi>
                                            </mml:munderover>
                                            <mml:mrow>
                                                <mml:mi>D</mml:mi>
                                                <mml:mo stretchy="false">(</mml:mo>
                                                <mml:mi>k</mml:mi>
                                                <mml:mo>&#x2212;</mml:mo>
                                                <mml:mi>c</mml:mi>
                                                <mml:mi>C</mml:mi>
                                                <mml:mi>C</mml:mi>
                                                <mml:mo stretchy="false">)</mml:mo>
                                            </mml:mrow>
                                        </mml:mstyle>
                                        <mml:mo>&#x2009;</mml:mo>
                                        <mml:mo>&#x2009;</mml:mo>
                                        <mml:mo>&#x2009;</mml:mo>
                                        <mml:mo>&#x2009;</mml:mo>
                                        <mml:mo>&#x2009;</mml:mo>
                                        <mml:mo stretchy="false">(</mml:mo>
                                        <mml:mn>6</mml:mn>
                                        <mml:mo stretchy="false">)</mml:mo>
                                    </mml:mrow>
                                </mml:math>
                            </disp-formula>
                        </p>
                        <p>where 
                            <italic toggle="yes">K</italic> is all CC elements, 
                            <italic toggle="yes">k</italic> is each CC element and 
                            <italic toggle="yes">D</italic> is the distance between 
                            <italic toggle="yes">k</italic> and its closest CC element 
                            <italic toggle="yes">cCC</italic>, excluding itself, in 
                            <italic toggle="yes">L</italic> total comparisons. With such an evaluation parameter, higher dispersion renders higher scores with the aim of evaluating the dispersion among selected CC elements.</p>
                    </list-item>
                    <list-item>
                        <label>c)</label>
                        <p>The average distance between CC samples (E) can be calculated using the following equation:</p>
                        <p>
                            <disp-formula id="e7">
                                <mml:math display="block" id="math7">
                                    <mml:mrow>
                                        <mml:msub>
                                            <mml:mi>E</mml:mi>
                                            <mml:mrow>
                                                <mml:mi>t</mml:mi>
                                                <mml:mi>o</mml:mi>
                                                <mml:mi>t</mml:mi>
                                            </mml:mrow>
                                        </mml:msub>
                                        <mml:mo>=</mml:mo>
                                        <mml:mfrac>
                                            <mml:mn>1</mml:mn>
                                            <mml:mi>L</mml:mi>
                                        </mml:mfrac>
                                        <mml:mstyle displaystyle="true">
                                            <mml:munderover>
                                                <mml:mo>&#x2211;</mml:mo>
                                                <mml:mrow>
                                                    <mml:mi>k</mml:mi>
                                                    <mml:mo>=</mml:mo>
                                                    <mml:mn>1</mml:mn>
                                                </mml:mrow>
                                                <mml:mi>K</mml:mi>
                                            </mml:munderover>
                                            <mml:mrow>
                                                <mml:mstyle displaystyle="true">
                                                    <mml:munderover>
                                                        <mml:mo>&#x2211;</mml:mo>
                                                        <mml:mrow>
                                                            <mml:mi>j</mml:mi>
                                                            <mml:mo>=</mml:mo>
                                                            <mml:mn>1</mml:mn>
                                                        </mml:mrow>
                                                        <mml:mi>J</mml:mi>
                                                    </mml:munderover>
                                                    <mml:mrow>
                                                        <mml:mi>D</mml:mi>
                                                        <mml:mo stretchy="false">(</mml:mo>
                                                        <mml:mi>k</mml:mi>
                                                        <mml:mo>&#x2212;</mml:mo>
                                                        <mml:mi>c</mml:mi>
                                                        <mml:mi>C</mml:mi>
                                                        <mml:msub>
                                                            <mml:mi>C</mml:mi>
                                                            <mml:mi>j</mml:mi>
                                                        </mml:msub>
                                                        <mml:mo stretchy="false">)</mml:mo>
                                                    </mml:mrow>
                                                </mml:mstyle>
                                            </mml:mrow>
                                        </mml:mstyle>
                                        <mml:mo>&#x2009;</mml:mo>
                                        <mml:mo>&#x2009;</mml:mo>
                                        <mml:mo>&#x2009;</mml:mo>
                                        <mml:mo>&#x2009;</mml:mo>
                                        <mml:mo>&#x2009;</mml:mo>
                                        <mml:mo>&#x2009;</mml:mo>
                                        <mml:mo stretchy="false">(</mml:mo>
                                        <mml:mn>7</mml:mn>
                                        <mml:mo stretchy="false">)</mml:mo>
                                    </mml:mrow>
                                </mml:math>
                            </disp-formula>
                        </p>
                        <p>where 
                            <italic toggle="yes">K</italic> is all CC elements, 
                            <italic toggle="yes">k</italic> is each CC element and 
                            <italic toggle="yes">D</italic> is the distance between 
                            <italic toggle="yes">k</italic> and all other 
                            <italic toggle="yes">j</italic>th CC elements 
                            <italic toggle="yes">cCC</italic>, excluding itself, in 
                            <italic toggle="yes">L</italic> total comparisons. This evaluation parameter indicates higher scores when CC elements have greater distances between themselves.</p>
                        <p>While the previous evaluation parameters are useful for data dispersion analysis, they do not evaluate how well the distribution of the MC is represented in the CC; therefore, the following distribution comparison tests were included:</p>
                    </list-item>
                    <list-item>
                        <label>d)</label>
                        <p>The homogeneity test (
                            <italic toggle="yes">F</italic>-test for variances and 
                            <italic toggle="yes">t</italic>-test for means; 
                            <italic toggle="yes">&#x03b1;</italic> = 0.05) between the CC and MC for each trait can be represented as a percentage of traits that are statistically different (MD for means and VT for variances)
                            <sup>
                                <xref ref-type="bibr" rid="ref-9">9</xref>
                            </sup>.</p>
                    </list-item>
                    <list-item>
                        <label>e)</label>
                        <p>The coincidence rate (CR) can be calculated using the following equation:</p>
                        <p>
                            <disp-formula id="e8">
                                <mml:math display="block" id="math8">
                                    <mml:mrow>
                                        <mml:mi>C</mml:mi>
                                        <mml:mi>R</mml:mi>
                                        <mml:mo>=</mml:mo>
                                        <mml:mfrac>
                                            <mml:mn>1</mml:mn>
                                            <mml:mi>M</mml:mi>
                                        </mml:mfrac>
                                        <mml:mstyle displaystyle="true">
                                            <mml:munderover>
                                                <mml:mo>&#x2211;</mml:mo>
                                                <mml:mrow>
                                                    <mml:mi>m</mml:mi>
                                                    <mml:mo>=</mml:mo>
                                                    <mml:mn>1</mml:mn>
                                                </mml:mrow>
                                                <mml:mi>M</mml:mi>
                                            </mml:munderover>
                                            <mml:mrow>
                                                <mml:mfrac>
                                                    <mml:mrow>
                                                        <mml:msub>
                                                            <mml:mi>R</mml:mi>
                                                            <mml:mrow>
                                                                <mml:mi>C</mml:mi>
                                                                <mml:mi>C</mml:mi>
                                                            </mml:mrow>
                                                        </mml:msub>
                                                    </mml:mrow>
                                                    <mml:mrow>
                                                        <mml:msub>
                                                            <mml:mi>R</mml:mi>
                                                            <mml:mrow>
                                                                <mml:mi>M</mml:mi>
                                                                <mml:mi>C</mml:mi>
                                                            </mml:mrow>
                                                        </mml:msub>
                                                    </mml:mrow>
                                                </mml:mfrac>
                                                <mml:mo>&#x2217;</mml:mo>
                                                <mml:mn>100</mml:mn>
                                            </mml:mrow>
                                        </mml:mstyle>
                                        <mml:mo>&#x2009;</mml:mo>
                                        <mml:mo>&#x2009;</mml:mo>
                                        <mml:mo>&#x2009;</mml:mo>
                                        <mml:mo>&#x2009;</mml:mo>
                                        <mml:mo>&#x2009;</mml:mo>
                                        <mml:mo stretchy="false">(</mml:mo>
                                        <mml:mn>8</mml:mn>
                                        <mml:mo stretchy="false">)</mml:mo>
                                    </mml:mrow>
                                </mml:math>
                            </disp-formula>
                        </p>
                        <p>where 
                            <italic toggle="yes">R</italic> is the range of each 
                            <italic toggle="yes">m</italic> trait, and 
                            <italic toggle="yes">M</italic> represents the number of traits.</p>
                    </list-item>
                    <list-item>
                        <label>f)</label>
                        <p>The variable rate (CV) can be calculated using the following equation:</p>
                        <p>
                            <disp-formula id="e9">
                                <mml:math display="block" id="math9">
                                    <mml:mrow>
                                        <mml:mi>C</mml:mi>
                                        <mml:mi>V</mml:mi>
                                        <mml:mo>=</mml:mo>
                                        <mml:mfrac>
                                            <mml:mn>1</mml:mn>
                                            <mml:mi>M</mml:mi>
                                        </mml:mfrac>
                                        <mml:mstyle displaystyle="true">
                                            <mml:munderover>
                                                <mml:mo>&#x2211;</mml:mo>
                                                <mml:mrow>
                                                    <mml:mi>m</mml:mi>
                                                    <mml:mo>=</mml:mo>
                                                    <mml:mn>1</mml:mn>
                                                </mml:mrow>
                                                <mml:mi>M</mml:mi>
                                            </mml:munderover>
                                            <mml:mrow>
                                                <mml:mfrac>
                                                    <mml:mrow>
                                                        <mml:mi>C</mml:mi>
                                                        <mml:msub>
                                                            <mml:mi>V</mml:mi>
                                                            <mml:mrow>
                                                                <mml:mi>C</mml:mi>
                                                                <mml:mi>C</mml:mi>
                                                            </mml:mrow>
                                                        </mml:msub>
                                                    </mml:mrow>
                                                    <mml:mrow>
                                                        <mml:mi>C</mml:mi>
                                                        <mml:msub>
                                                            <mml:mi>V</mml:mi>
                                                            <mml:mrow>
                                                                <mml:mi>M</mml:mi>
                                                                <mml:mi>C</mml:mi>
                                                            </mml:mrow>
                                                        </mml:msub>
                                                    </mml:mrow>
                                                </mml:mfrac>
                                                <mml:mo>&#x2217;</mml:mo>
                                                <mml:mn>100</mml:mn>
                                            </mml:mrow>
                                        </mml:mstyle>
                                        <mml:mo>&#x2009;</mml:mo>
                                        <mml:mo>&#x2009;</mml:mo>
                                        <mml:mo>&#x2009;</mml:mo>
                                        <mml:mo>&#x2009;</mml:mo>
                                        <mml:mo>&#x2009;</mml:mo>
                                        <mml:mo stretchy="false">(</mml:mo>
                                        <mml:mn>9</mml:mn>
                                        <mml:mo stretchy="false">)</mml:mo>
                                    </mml:mrow>
                                </mml:math>
                            </disp-formula>
                        </p>
                        <p>where 
                            <italic toggle="yes">CV</italic> is the coefficient of the variation of each 
                            <italic toggle="yes">m</italic> trait in the CC and MC, and 
                            <italic toggle="yes">M</italic> is the number of traits.</p>
                        <p>According to Hu 
                            <italic toggle="yes">et al.</italic>
                            <sup>
                                <xref ref-type="bibr" rid="ref-10">10</xref>
                            </sup>, a valid CC has 
                            <italic toggle="yes">CR</italic> &gt; 80 and 
                            <italic toggle="yes">MD</italic> &lt; 20, which are the limits for the ideal representation of the identity and distribution of the MC.</p>
                    </list-item>
                    <list-item>
                        <label>g)</label>
                        <p>The alleles coverage (CA) can be calculated using the equation as follows:</p>
                        <p>
                            <disp-formula id="e10">
                                <mml:math display="block" id="math10">
                                    <mml:mrow>
                                        <mml:mi>C</mml:mi>
                                        <mml:mi>A</mml:mi>
                                        <mml:mo>=</mml:mo>
                                        <mml:mrow>
                                            <mml:mo>[</mml:mo>
                                            <mml:mrow>
                                                <mml:mrow>
                                                    <mml:mo>|</mml:mo>
                                                    <mml:mrow>
                                                        <mml:mn>1</mml:mn>
                                                        <mml:mo>&#x2212;</mml:mo>
                                                        <mml:mrow>
                                                            <mml:mo>(</mml:mo>
                                                            <mml:mrow>
                                                                <mml:mrow>
                                                                    <mml:mo>|</mml:mo>
                                                                    <mml:mrow>
                                                                        <mml:mn>1</mml:mn>
                                                                        <mml:mo>&#x2212;</mml:mo>
                                                                        <mml:mi>A</mml:mi>
                                                                        <mml:mi>C</mml:mi>
                                                                        <mml:mi>C</mml:mi>
                                                                    </mml:mrow>
                                                                    <mml:mo>|</mml:mo>
                                                                </mml:mrow>
                                                                <mml:mo>/</mml:mo>
                                                                <mml:mi>A</mml:mi>
                                                                <mml:mi>M</mml:mi>
                                                                <mml:mi>C</mml:mi>
                                                            </mml:mrow>
                                                            <mml:mo>)</mml:mo>
                                                        </mml:mrow>
                                                    </mml:mrow>
                                                    <mml:mo>|</mml:mo>
                                                </mml:mrow>
                                            </mml:mrow>
                                            <mml:mo>]</mml:mo>
                                        </mml:mrow>
                                        <mml:mo>&#x2217;</mml:mo>
                                        <mml:mn>100</mml:mn>
                                        <mml:mo>&#x2009;</mml:mo>
                                        <mml:mo>&#x2009;</mml:mo>
                                        <mml:mo>&#x2009;</mml:mo>
                                        <mml:mo>&#x2009;</mml:mo>
                                        <mml:mo stretchy="false">(</mml:mo>
                                        <mml:mn>10</mml:mn>
                                        <mml:mo stretchy="false">)</mml:mo>
                                    </mml:mrow>
                                </mml:math>
                            </disp-formula>
                        </p>
                        <p>where ACC is the set of alleles in the CC, and AMC is the set of alleles in the MC; CA measures the percentage of alleles from the MC that are present in the CC
                            <sup>
                                <xref ref-type="bibr" rid="ref-12">12</xref>
                            </sup>.</p>
                    </list-item>
                </list>
                <p>To compare the obtained CCs with an established methodology, we implemented Core Hunter 2 (CH)
                    <sup>
                        <xref ref-type="bibr" rid="ref-13">13</xref>
                    </sup> as a reference and used it with the program&#x2019;s default parameters on the agrological and genomic datasets.</p>
            </sec>
            <sec>
                <title>Experimental datasets</title>
                <p>To determine the efficiency of the analysis of data behaviour by a point-to-point direct comparison, a synthetic dataset was constructed using binary data (
                    <italic toggle="yes">Sdata</italic>) with manageable 
                    <italic toggle="yes">n</italic> and 
                    <italic toggle="yes">m</italic> elements (
                    <xref ref-type="other" rid="SM1">supplementary material 1</xref>).</p>
                <p>To test the algorithm in real biological-context scenarios, the CCs from different MCs were constructed and evaluated.</p>
                <p>To test the algorithm&#x2019;s CCs versus the scores of the MCs, 780 rice (
                    <italic toggle="yes">Oryza sativa</italic> (L.)) accession and 423 foxtail millet (
                    <italic toggle="yes">Setaria italica</italic> subsp. 
                    <italic toggle="yes">italica</italic> (L.) P. Beauv.) accession data were retrieved from the National Institute of Agrobiological Sciences (NIAS) 
                    <ext-link ext-link-type="uri" xlink:href="http://www.gene.affrc.go.jp/databases_en.php">http://www.gene.affrc.go.jp/databases_en.php</ext-link>.</p>
                <p>According to the available data, different datasets were assembled. The 762 SNPs from the 780 rice accessions retrieved from the NIAS database (
                    <italic toggle="yes">Rdata</italic>) were divided arbitrarily into two subsets of 331 SNPs each for constructing two smaller datasets (
                    <italic toggle="yes">RdataI</italic> and 
                    <italic toggle="yes">RdataIII</italic>). In addition, ATs were categorized and mapped into the binary data for 273 of the 780 accessions, resulting in 38 variables (
                    <italic toggle="yes">RdataII</italic>). The variables from the 423 foxtail millet genotypes with transposon displays
                    <sup>
                        <xref ref-type="bibr" rid="ref-24">24</xref>
                    </sup> were used as a single dataset (
                    <italic toggle="yes">Fdata</italic>). For a subset of 141 accessions (
                    <italic toggle="yes">FdataI</italic>), 9 ATs were categorized and mapped into binary data, resulting in 28 variables (
                    <italic toggle="yes">FdataII</italic>). The substitution tables used during this mapping are presented as 
                    <xref ref-type="other" rid="SM1">supplementary material 1</xref>.</p>
            </sec>
            <sec>
                <title>Implementation</title>
                <p>All methodological procedures (except for CH, which was implemented according to the software&#x2019;s default parameters and which is available for download at 
                    <ext-link ext-link-type="uri" xlink:href="http://www.corehunter.org">www.corehunter.org</ext-link>) were performed using FreeMat v4.2 (
                    <ext-link ext-link-type="uri" xlink:href="http://www.freemat.sourceforge.net">www.freemat.sourceforge.net</ext-link>). All original codes are available as 
                    <xref ref-type="other" rid="SM1">supplementary material 1</xref>.</p>
            </sec>
        </sec>
        <sec sec-type="results | discussion">
            <title>Results and discussion</title>
            <sec>
                <title>Selection and evaluation</title>
                <p>The selection criteria were chosen to look for the best possible distribution of selected CC elements within the DM. Although hierarchical clustering has proven to be an effective method for determining collection structure and sampling CC
                    <sup>
                        <xref ref-type="bibr" rid="ref-25">25</xref>
                    </sup> and although it has been implemented in different crops
                    <sup>
                        <xref ref-type="bibr" rid="ref-26">26</xref>,
                        <xref ref-type="bibr" rid="ref-27">27</xref>
                    </sup> and included in various selection algorithms
                    <sup>
                        <xref ref-type="bibr" rid="ref-11">11</xref>
                    </sup>, hierarchical reconstruction presents the challenge of selecting an appropriate model for biological interpretation that can be applied to everything from unweighted pair-group averages to Markov models in Bayesian estimations
                    <sup>
                        <xref ref-type="bibr" rid="ref-28">28</xref>
                    </sup>. To avoid the challenge of selecting a reconstruction model, we decided to work strictly with the DM. By selecting the items described in this methodology, we aimed to retrieve representative elements from among the distributions of collections; however, because of its iterative nature, this methodology may render high redundancy under certain data distributions. Despite this limitation, the methodology has proven to be capable of selecting representative elements of the MC&#x2019;s diversity.</p>
                <p>Evaluation criteria were applied according to Odong 
                    <italic toggle="yes">et al.</italic>
                    <sup>
                        <xref ref-type="bibr" rid="ref-7">7</xref>
                    </sup> without excluding the classic criteria used in 
                    <xref ref-type="bibr" rid="ref-9">9</xref>,
                    <xref ref-type="bibr" rid="ref-10">10</xref>. The selected CCs render proper results in general terms. As expected, the selected CCs did not always reach optimal values for MD and CR; this is due to the fact that the aim of the selection method is not to render a CC with a distribution similar to that of the MC, but to include as much diversity as possible.</p>
                <p>It is our belief that scoring the CC sets obtained with these methodologies will enable genetic resource banks to provide clear descriptors of what their CC strengths and limitations are with respect to the MC from which they come and will provide adequate tools for determining the possible purposes of the selected CCs.</p>
            </sec>
            <sec>
                <title>Mapping</title>
                <p>Although several representations of genotypic characteristics (particularly those involving DNA sequences
                    <sup>
                        <xref ref-type="bibr" rid="ref-29">29</xref>&#x2013;
                        <xref ref-type="bibr" rid="ref-31">31</xref>
                    </sup>) have been proposed, real-number-based mappings have not been discarded; indeed, this type of mapping has been extensively studied for signal analysis even though it presents two principal problems: the preferential magnitude of some nucleotides and the non-equidistance of all nucleotides
                    <sup>
                        <xref ref-type="bibr" rid="ref-32">32</xref>,
                        <xref ref-type="bibr" rid="ref-33">33</xref>
                    </sup>. The arbitrary values selected for the numerical representation of SNP genotypes aim to maintain equidistant relations among purines and among pyrimidines in such a manner that the same distance is also preserved between at least one of them and the undetermined values. ATs are represented as binary data. This representation may prove useful for discrete data but requires a clustering procedure for continuous data. In this study, we arbitrarily generated clusters for the latter and then represented them as the former. Although this implementation may not be the most accurate regarding biological or agronomical significance, it serves as the first approach for testing the feasibility of the use of signal processing techniques when merging several datasets to construct one CC.</p>
            </sec>
            <sec>
                <title>RAW 
                    <italic toggle="yes">versus</italic> FFT</title>
                <p>The RAW comparison establishes a distance value on the basis of the average distance between each mapped value on each element, while the FFT power spectra implementation compares the signals in the frequency domain. Using FFT, it was possible to establish a DM on the basis of how data &#x2018;shifted&#x2019; rather than on the basis of average point-to-point comparisons. The FFT approach provides a different DM, where its compared elements are clustered based on the similarity of the shift among data, regardless of whether the shift is in the opposite phase. We believe that this procedure may reveal additional information about the relations not only between elements but also between the individual components within each element.</p>
                <p>FFT comparisons of signals without PCA are a good approach for CC selection. Nevertheless, PCA implementation enables us to avoid potentially misleading results from random data arrangements, such as palindromic data, which could result in the same power spectra. Moreover, through PCA, we could organize data according to their levels of impact on the difference between accessions, which &#x2013; when their magnitudes were obtained &#x2013; inherently rendered a representation of informativity relations among values. This &#x2018;data behaviour&#x2019; was used as the element for pairwise comparisons, and although this approach clusters differently from RAW comparisons, we believe that it will provide a new perspective for CC selection and open the possibility of further data exploration.</p>
                <p>Our first approach was to measure the comparisons under different 
                    <italic toggle="yes">K</italic> values. We compared the approach of the RAW signals with the PCA-FFT-treated signals. Results from 
                    <italic toggle="yes">Sdata, Fdata</italic> and 
                    <italic toggle="yes">Rdata</italic> are presented in 
                    <xref ref-type="table" rid="T1">Table 1</xref>&#x2013;
                    <xref ref-type="table" rid="T3">Table 3</xref>. As expected, most evaluation criteria improved as 
                    <italic toggle="yes">K</italic> increased.</p>
                <table-wrap id="T1" orientation="portrait" position="anchor">
                    <label>Table 1. </label>
                    <caption>
                        <title>&#x2206; 
                            <italic toggle="yes">K</italic> selected CC scores from MC 
                            <italic toggle="yes">Sdata</italic> Raw and PCA Signal evaluated with 
                            <italic toggle="yes">Sdata</italic>.</title>
                    </caption>
                    <table content-type="article-table" frame="hsides">
                        <thead>
                            <tr>
                                <th colspan="1" rowspan="1"/>
                                <th align="center" colspan="3" rowspan="1">
                                    <italic toggle="yes">Sdata PCA</italic>
							</th>
                                <th align="center" colspan="3" rowspan="1">
								
                                    <italic toggle="yes">Sdata RAW</italic>
							</th>
                            </tr>
                            <tr>
                                <th align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">K</italic>
                                </th>
                                <th align="center" colspan="1" rowspan="1">12</th>
                                <th align="center" colspan="1" rowspan="1">18</th>
                                <th align="center" colspan="1" rowspan="1">24</th>
                                <th align="center" colspan="1" rowspan="1">12</th>
                                <th align="center" colspan="1" rowspan="1">18</th>
                                <th align="center" colspan="1" rowspan="1">24</th>
                            </tr>
                        </thead>
                        <tbody>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">ANE</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">0.2348</td>
                                <td align="center" colspan="1" rowspan="1">0.2311</td>
                                <td align="center" colspan="1" rowspan="1">0.2164</td>
                                <td align="center" colspan="1" rowspan="1">0.2697</td>
                                <td align="center" colspan="1" rowspan="1">0.2287</td>
                                <td align="center" colspan="1" rowspan="1">0.2164</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">ENE</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">0.339</td>
                                <td align="center" colspan="1" rowspan="1">0.3386</td>
                                <td align="center" colspan="1" rowspan="1">0.3401</td>
                                <td align="center" colspan="1" rowspan="1">0.3696</td>
                                <td align="center" colspan="1" rowspan="1">0.3228</td>
                                <td align="center" colspan="1" rowspan="1">0.3214</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">E</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">0.5562</td>
                                <td align="center" colspan="1" rowspan="1">0.5622</td>
                                <td align="center" colspan="1" rowspan="1">0.5547</td>
                                <td align="center" colspan="1" rowspan="1">0.5558</td>
                                <td align="center" colspan="1" rowspan="1">0.5333</td>
                                <td align="center" colspan="1" rowspan="1">0.5299</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">MD</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">0</td>
                                <td align="center" colspan="1" rowspan="1">0</td>
                                <td align="center" colspan="1" rowspan="1">0</td>
                                <td align="center" colspan="1" rowspan="1">0</td>
                                <td align="center" colspan="1" rowspan="1">0</td>
                                <td align="center" colspan="1" rowspan="1">0</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">VT</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">41.6667</td>
                                <td align="center" colspan="1" rowspan="1">50</td>
                                <td align="center" colspan="1" rowspan="1">41.6667</td>
                                <td align="center" colspan="1" rowspan="1">33.3333</td>
                                <td align="center" colspan="1" rowspan="1">58.3333</td>
                                <td align="center" colspan="1" rowspan="1">41.6667</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">CR</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">64.8403</td>
                                <td align="center" colspan="1" rowspan="1">71.6918</td>
                                <td align="center" colspan="1" rowspan="1">73.7154</td>
                                <td align="center" colspan="1" rowspan="1">60.6447</td>
                                <td align="center" colspan="1" rowspan="1">75.2465</td>
                                <td align="center" colspan="1" rowspan="1">80.4716</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">CV</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">9080.798</td>
                                <td align="center" colspan="1" rowspan="1">61.2074</td>
                                <td align="center" colspan="1" rowspan="1">86.0876</td>
                                <td align="center" colspan="1" rowspan="1">136.6446</td>
                                <td align="center" colspan="1" rowspan="1">139.1418</td>
                                <td align="center" colspan="1" rowspan="1">280.8481</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">AR</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">74.3363</td>
                                <td align="center" colspan="1" rowspan="1">81.4159</td>
                                <td align="center" colspan="1" rowspan="1">89.3805</td>
                                <td align="center" colspan="1" rowspan="1">61.9469</td>
                                <td align="center" colspan="1" rowspan="1">77.8761</td>
                                <td align="center" colspan="1" rowspan="1">80.531</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
                <table-wrap id="T2" orientation="portrait" position="anchor">
                    <label>Table 2. </label>
                    <caption>
                        <title>&#x2206; 
                            <italic toggle="yes">K</italic> selected CC scores from MC 
                            <italic toggle="yes">Fdata</italic> Raw and PCA Signal evaluated with 
                            <italic toggle="yes">Fdata</italic>.</title>
                    </caption>
                    <table content-type="article-table" frame="hsides">
                        <thead>
                            <tr>
                                <th colspan="1" rowspan="1"/>
                                <th align="center" colspan="3" rowspan="1">
								
                                    <italic toggle="yes">Fdata PCA</italic>
							</th>
                                <th align="center" colspan="3" rowspan="1">
								
                                    <italic toggle="yes">Fdata RAW</italic>
							</th>
                            </tr>
                            <tr>
                                <th align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">K</italic>
                                </th>
                                <th align="center" colspan="1" rowspan="1">48</th>
                                <th align="center" colspan="1" rowspan="1">72</th>
                                <th align="center" colspan="1" rowspan="1">96</th>
                                <th align="center" colspan="1" rowspan="1">48</th>
                                <th align="center" colspan="1" rowspan="1">72</th>
                                <th align="center" colspan="1" rowspan="1">96</th>
                            </tr>
                        </thead>
                        <tbody>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">ANE</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">0.6454</td>
                                <td align="center" colspan="1" rowspan="1">0.6423</td>
                                <td align="center" colspan="1" rowspan="1">0.6407</td>
                                <td align="center" colspan="1" rowspan="1">0.6489</td>
                                <td align="center" colspan="1" rowspan="1">0.6431</td>
                                <td align="center" colspan="1" rowspan="1">0.643</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">ENE</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">0.646</td>
                                <td align="center" colspan="1" rowspan="1">0.6472</td>
                                <td align="center" colspan="1" rowspan="1">0.6474</td>
                                <td align="center" colspan="1" rowspan="1">0.65</td>
                                <td align="center" colspan="1" rowspan="1">0.6448</td>
                                <td align="center" colspan="1" rowspan="1">0.6452</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">E</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">0.7297</td>
                                <td align="center" colspan="1" rowspan="1">0.7301</td>
                                <td align="center" colspan="1" rowspan="1">0.7304</td>
                                <td align="center" colspan="1" rowspan="1">0.7231</td>
                                <td align="center" colspan="1" rowspan="1">0.7236</td>
                                <td align="center" colspan="1" rowspan="1">0.7239</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">MD</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">1.1799</td>
                                <td align="center" colspan="1" rowspan="1">0.59</td>
                                <td align="center" colspan="1" rowspan="1">0.59</td>
                                <td align="center" colspan="1" rowspan="1">1.7699</td>
                                <td align="center" colspan="1" rowspan="1">1.4749</td>
                                <td align="center" colspan="1" rowspan="1">1.4749</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">VT</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">50.4425</td>
                                <td align="center" colspan="1" rowspan="1">53.6873</td>
                                <td align="center" colspan="1" rowspan="1">56.6372</td>
                                <td align="center" colspan="1" rowspan="1">50.7375</td>
                                <td align="center" colspan="1" rowspan="1">56.0472</td>
                                <td align="center" colspan="1" rowspan="1">55.1622</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">CR</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">83.6883</td>
                                <td align="center" colspan="1" rowspan="1">87.0605</td>
                                <td align="center" colspan="1" rowspan="1">88.9709</td>
                                <td align="center" colspan="1" rowspan="1">83.5334</td>
                                <td align="center" colspan="1" rowspan="1">86.9308</td>
                                <td align="center" colspan="1" rowspan="1">87.7461</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">CV</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">0.8494</td>
                                <td align="center" colspan="1" rowspan="1">0.419</td>
                                <td align="center" colspan="1" rowspan="1">0.7357</td>
                                <td align="center" colspan="1" rowspan="1">1.1037</td>
                                <td align="center" colspan="1" rowspan="1">4.74</td>
                                <td align="center" colspan="1" rowspan="1">0.7361</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">VA</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">96.3945</td>
                                <td align="center" colspan="1" rowspan="1">97.7652</td>
                                <td align="center" colspan="1" rowspan="1">98.5995</td>
                                <td align="center" colspan="1" rowspan="1">95.3516</td>
                                <td align="center" colspan="1" rowspan="1">97.497</td>
                                <td align="center" colspan="1" rowspan="1">97.4374</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
                <table-wrap id="T3" orientation="portrait" position="anchor">
                    <label>Table 3. </label>
                    <caption>
                        <title>&#x2206; 
                            <italic toggle="yes">K</italic> selected CC scores from MC 
                            <italic toggle="yes">Rdata</italic> Raw and PCA Signal evaluated with 
                            <italic toggle="yes">Rdata</italic>.</title>
                    </caption>
                    <table content-type="article-table" frame="hsides">
                        <thead>
                            <tr>
                                <th colspan="1" rowspan="1"/>
                                <th align="center" colspan="3" rowspan="1">
								
                                    <italic toggle="yes">Rdata PCA</italic>
							</th>
                                <th align="center" colspan="3" rowspan="1">
								
                                    <italic toggle="yes">Rdata RAW</italic>
							</th>
                            </tr>
                            <tr>
                                <th align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">K</italic>
                                </th>
                                <th align="center" colspan="1" rowspan="1">48</th>
                                <th align="center" colspan="1" rowspan="1">96</th>
                                <th align="center" colspan="1" rowspan="1">156</th>
                                <th align="center" colspan="1" rowspan="1">48</th>
                                <th align="center" colspan="1" rowspan="1">96</th>
                                <th align="center" colspan="1" rowspan="1">156</th>
                            </tr>
                        </thead>
                        <tbody>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">ANE</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">0.6013</td>
                                <td align="center" colspan="1" rowspan="1">0.5966</td>
                                <td align="center" colspan="1" rowspan="1">0.5942</td>
                                <td align="center" colspan="1" rowspan="1">0.6118</td>
                                <td align="center" colspan="1" rowspan="1">0.6052</td>
                                <td align="center" colspan="1" rowspan="1">0.6042</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">ENE</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">0.5939</td>
                                <td align="center" colspan="1" rowspan="1">0.5944</td>
                                <td align="center" colspan="1" rowspan="1">0.5981</td>
                                <td align="center" colspan="1" rowspan="1">0.6106</td>
                                <td align="center" colspan="1" rowspan="1">0.6085</td>
                                <td align="center" colspan="1" rowspan="1">0.609</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">E</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">0.7105</td>
                                <td align="center" colspan="1" rowspan="1">0.7074</td>
                                <td align="center" colspan="1" rowspan="1">0.7051</td>
                                <td align="center" colspan="1" rowspan="1">0.703</td>
                                <td align="center" colspan="1" rowspan="1">0.7038</td>
                                <td align="center" colspan="1" rowspan="1">0.7054</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">MD</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">9.1146</td>
                                <td align="center" colspan="1" rowspan="1">5.9896</td>
                                <td align="center" colspan="1" rowspan="1">3.9062</td>
                                <td align="center" colspan="1" rowspan="1">10.1562</td>
                                <td align="center" colspan="1" rowspan="1">5.4688</td>
                                <td align="center" colspan="1" rowspan="1">4.4271</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">VT</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">42.4479</td>
                                <td align="center" colspan="1" rowspan="1">48.6979</td>
                                <td align="center" colspan="1" rowspan="1">58.0729</td>
                                <td align="center" colspan="1" rowspan="1">57.5521</td>
                                <td align="center" colspan="1" rowspan="1">72.9167</td>
                                <td align="center" colspan="1" rowspan="1">70.0521</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">CR</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">70.5716</td>
                                <td align="center" colspan="1" rowspan="1">78.477</td>
                                <td align="center" colspan="1" rowspan="1">83.2957</td>
                                <td align="center" colspan="1" rowspan="1">69.9022</td>
                                <td align="center" colspan="1" rowspan="1">78.1045</td>
                                <td align="center" colspan="1" rowspan="1">80.0167</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">CV</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">1.0171</td>
                                <td align="center" colspan="1" rowspan="1">0.4343</td>
                                <td align="center" colspan="1" rowspan="1">0.3137</td>
                                <td align="center" colspan="1" rowspan="1">7.9407</td>
                                <td align="center" colspan="1" rowspan="1">0.4375</td>
                                <td align="center" colspan="1" rowspan="1">1.1344</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">VA</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">92.6758</td>
                                <td align="center" colspan="1" rowspan="1">96.8992</td>
                                <td align="center" colspan="1" rowspan="1">98.5298</td>
                                <td align="center" colspan="1" rowspan="1">93.9856</td>
                                <td align="center" colspan="1" rowspan="1">98.1823</td>
                                <td align="center" colspan="1" rowspan="1">98.5031</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
                <p>The use of PCA signals renders better overall scores than the use of RAW signals in 
                    <italic toggle="yes">Sdata</italic> and 
                    <italic toggle="yes">Fdata</italic>; however, this advantage diminishes in 
                    <italic toggle="yes">Rdata</italic>. We speculate that this difference can be explained by the mapping procedures used; further research regarding this matter is encouraged.</p>
                <p>Using the 
                    <italic toggle="yes">K</italic> values rendered by CH, we used both CH and FFT to generate the CCs on the above datasets. The evaluation of these CCs is summarized in 
                    <xref ref-type="table" rid="T4">Table 4</xref> and in 
                    <xref ref-type="fig" rid="f4">Figure 4</xref> and 
                    <xref ref-type="fig" rid="f5">Figure 5</xref>. Both methodologies rendered similar results, yet CH rendered better results on parameters representing MC distribution; this could be an effect of our selection method&#x2019;s intrinsic redundancy.</p>
                <table-wrap id="T4" orientation="portrait" position="anchor">
                    <label>Table 4. </label>
                    <caption>
                        <title>CCs selected from MC 
                            <italic toggle="yes">Sdata</italic>, 
                            <italic toggle="yes">Fdata</italic> and 
                            <italic toggle="yes">Rdata</italic> using PCA signals and 
                            <italic toggle="yes">Core Hunter</italic>, each compared with its respective source dataset.</title>
                    </caption>
                    <table content-type="article-table" frame="hsides">
                        <thead>
                            <tr>
                                <th colspan="1" rowspan="1"/>
                                <th align="center" colspan="2" rowspan="1">
                                    <italic toggle="yes">Sdata</italic>
                                </th>
                                <th align="center" colspan="2" rowspan="1">
                                    <italic toggle="yes">Fdata</italic>
                                </th>
                                <th align="center" colspan="2" rowspan="1">
                                    <italic toggle="yes">Rdata</italic>
                                </th>
                            </tr>
                            <tr>
                                <th colspan="1" rowspan="1"/>
                                <th align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">PCA</italic>
                                </th>
                                <th align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">CH</italic>
                                </th>
                                <th align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">PCA</italic>
                                </th>
                                <th align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">CH</italic>
                                </th>
                                <th align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">PCA</italic>
                                </th>
                                <th align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">CH</italic>
                                </th>
                            </tr>
                            <tr>
                                <th colspan="1" rowspan="1">
                                    <italic toggle="yes">K</italic>
                                </th>
                                <th align="center" colspan="2" rowspan="1">12</th>
                                <th align="center" colspan="2" rowspan="1">84</th>
                                <th align="center" colspan="2" rowspan="1">156</th>
                            </tr>
                        </thead>
                        <tbody>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">ANE</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">0.2348</td>
                                <td align="center" colspan="1" rowspan="1">0.2314</td>
                                <td align="center" colspan="1" rowspan="1">0.6407</td>
                                <td align="center" colspan="1" rowspan="1">0.6392</td>
                                <td align="center" colspan="1" rowspan="1">0.5942</td>
                                <td align="center" colspan="1" rowspan="1">0.5952</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">ENE</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">0.339</td>
                                <td align="center" colspan="1" rowspan="1">0.3906</td>
                                <td align="center" colspan="1" rowspan="1">0.6474</td>
                                <td align="center" colspan="1" rowspan="1">0.6386</td>
                                <td align="center" colspan="1" rowspan="1">0.5981</td>
                                <td align="center" colspan="1" rowspan="1">0.6047</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">E</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">0.5562</td>
                                <td align="center" colspan="1" rowspan="1">0.563</td>
                                <td align="center" colspan="1" rowspan="1">0.7304</td>
                                <td align="center" colspan="1" rowspan="1">0.7176</td>
                                <td align="center" colspan="1" rowspan="1">0.7051</td>
                                <td align="center" colspan="1" rowspan="1">0.7017</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">MD</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">0</td>
                                <td align="center" colspan="1" rowspan="1">0</td>
                                <td align="center" colspan="1" rowspan="1">0.59</td>
                                <td align="center" colspan="1" rowspan="1">1.1799</td>
                                <td align="center" colspan="1" rowspan="1">3.9062</td>
                                <td align="center" colspan="1" rowspan="1">5.4688</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">VT</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">41.6667</td>
                                <td align="center" colspan="1" rowspan="1">58.3333</td>
                                <td align="center" colspan="1" rowspan="1">56.6372</td>
                                <td align="center" colspan="1" rowspan="1">66.6667</td>
                                <td align="center" colspan="1" rowspan="1">58.0729</td>
                                <td align="center" colspan="1" rowspan="1">86.7188</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">CR</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">65.6045</td>
                                <td align="center" colspan="1" rowspan="1">76.1001</td>
                                <td align="center" colspan="1" rowspan="1">88.9709</td>
                                <td align="center" colspan="1" rowspan="1">93.0119</td>
                                <td align="center" colspan="1" rowspan="1">83.2957</td>
                                <td align="center" colspan="1" rowspan="1">89.6723</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">CV</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">9080.978</td>
                                <td align="center" colspan="1" rowspan="1">132.6078</td>
                                <td align="center" colspan="1" rowspan="1">0.7357</td>
                                <td align="center" colspan="1" rowspan="1">0.429</td>
                                <td align="center" colspan="1" rowspan="1">0.3137</td>
                                <td align="center" colspan="1" rowspan="1">0.4001</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">AR</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">74.3363</td>
                                <td align="center" colspan="1" rowspan="1">76.9912</td>
                                <td align="center" colspan="1" rowspan="1">98.5995</td>
                                <td align="center" colspan="1" rowspan="1">98.4803</td>
                                <td align="center" colspan="1" rowspan="1">98.5298</td>
                                <td align="center" colspan="1" rowspan="1">99.3852</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
                <fig fig-type="figure" id="f4" orientation="portrait" position="float">
                    <label>Figure 4. </label>
                    <caption>
                        <p>First two principal components&#x2019; distributions of 
                            <italic toggle="yes">k</italic>=11 CC (orange) selected by 
                            <italic toggle="yes">CH</italic> (
                            <italic toggle="yes">a</italic>), 
                            <italic toggle="yes">PCA</italic> (
                            <italic toggle="yes">b</italic>) and 
                            <italic toggle="yes">RAW</italic> (
                            <italic toggle="yes">c</italic>) in 
                            <italic toggle="yes">Sdata</italic> distribution (blue).</p>
                    </caption>
                    <graphic orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/6857/ae10c947-df55-41ba-8b6b-8759d1e5d579_figure4.gif"/>
                </fig>
                <fig fig-type="figure" id="f5" orientation="portrait" position="float">
                    <label>Figure 5. </label>
                    <caption>
                        <p>First two principal components&#x2019; distributions of 
                            <italic toggle="yes">k</italic>=84 CC (orange) selected by 
                            <italic toggle="yes">CH</italic> (
                            <italic toggle="yes">a</italic>) and 
                            <italic toggle="yes">PCA</italic> (
                            <italic toggle="yes">b</italic>) in 
                            <italic toggle="yes">Fdata</italic> distribution (blue).</p>
                    </caption>
                    <graphic orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/6857/ae10c947-df55-41ba-8b6b-8759d1e5d579_figure5.gif"/>
                </fig>
                <p>Thus far, the proposed CC selection method and algorithm appear worthy of further exploration. We are aware that two particular fundamental elements require immediate attention. First, a better mapping solution for both genotypic and AT numerical representation needs to be determined. Second, the selection system developed by us is directly based on the DM and is prone to high redundancy in some data distributions. As discussed earlier, this selection system was chosen in order to avoid the problems associated with hierarchical clustering and further allocation selections
                    <sup>
                        <xref ref-type="bibr" rid="ref-13">13</xref>,
                        <xref ref-type="bibr" rid="ref-34">34</xref>
                    </sup>. Both issues should be addressed in the near future.</p>
            </sec>
            <sec>
                <title>Comprehensive data analysis</title>
                <p>To demonstrate that FFT-based CC selection can include and analyse data regardless of its origin, we concatenated corresponding signals from 
                    <italic toggle="yes">FdataI</italic> with 
                    <italic toggle="yes">FdataII</italic> as well as 
                    <italic toggle="yes">RdataI</italic> and 
                    <italic toggle="yes">RdataIII</italic> with 
                    <italic toggle="yes">RdataII</italic> to construct 
                    <italic toggle="yes">MFdata</italic>, 
                    <italic toggle="yes">MRdataI</italic> and 
                    <italic toggle="yes">MRdataIII</italic>. The comprehensive sets were used to construct CCs; the sets were then compared with both their original genotype and phenotype MCs. These comparisons are shown in 
                    <xref ref-type="table" rid="T5">Table 5</xref>&#x2013;
                    <xref ref-type="table" rid="T8">Table 8</xref>, and their distributions are represented in 
                    <xref ref-type="fig" rid="f6">Figure 6</xref>&#x2013;
                    <xref ref-type="fig" rid="f9">Figure 9</xref>.</p>
                <table-wrap id="T5" orientation="portrait" position="anchor">
                    <label>Table 5. </label>
                    <caption>
                        <title>CCs selected from MC 
                            <italic toggle="yes">FdataI</italic> and MC 
                            <italic toggle="yes">MFdata</italic> PCA signals and evaluated with 
                            <italic toggle="yes">FdataI</italic> and 
                            <italic toggle="yes">FdataII</italic>.</title>
                    </caption>
                    <table content-type="article-table" frame="hsides">
                        <thead>
                            <tr>
                                <th colspan="1" rowspan="1"/>
                                <th align="center" colspan="2" rowspan="1">
                                    <italic toggle="yes">vs FdataI</italic>
                                </th>
                                <th align="center" colspan="2" rowspan="1">
                                    <italic toggle="yes">vs FdataII</italic>
                                </th>
                            </tr>
                            <tr>
                                <th colspan="1" rowspan="1"/>
                                <th colspan="1" rowspan="1">
                                    <italic toggle="yes">FdataI</italic>
                                </th>
                                <th colspan="1" rowspan="1">
                                    <italic toggle="yes">MFdata</italic>
                                </th>
                                <th colspan="1" rowspan="1">
                                    <italic toggle="yes">FdataII</italic>
                                </th>
                                <th colspan="1" rowspan="1">
                                    <italic toggle="yes">MFdata</italic>
                                </th>
                            </tr>
                            <tr>
                                <th colspan="1" rowspan="1">
                                    <italic toggle="yes">K</italic>
                                </th>
                                <th align="center" colspan="4" rowspan="1">24</th>
                            </tr>
                        </thead>
                        <tbody>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">ANE</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">0.6333</td>
                                <td align="center" colspan="1" rowspan="1">0.6356</td>
                                <td align="center" colspan="1" rowspan="1">0.4049</td>
                                <td align="center" colspan="1" rowspan="1">0.4093</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">ENE</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">0.6413</td>
                                <td align="center" colspan="1" rowspan="1">0.6423</td>
                                <td align="center" colspan="1" rowspan="1">0.4374</td>
                                <td align="center" colspan="1" rowspan="1">0.4351</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">E</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">0.7194</td>
                                <td align="center" colspan="1" rowspan="1">0.7113</td>
                                <td align="center" colspan="1" rowspan="1">0.623</td>
                                <td align="center" colspan="1" rowspan="1">0.5914</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">MD</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">1.7668</td>
                                <td align="center" colspan="1" rowspan="1">2.4735</td>
                                <td align="center" colspan="1" rowspan="1">0</td>
                                <td align="center" colspan="1" rowspan="1">0</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">VT</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">66.0777</td>
                                <td align="center" colspan="1" rowspan="1">33.9223</td>
                                <td align="center" colspan="1" rowspan="1">46.42</td>
                                <td align="center" colspan="1" rowspan="1">64.2857</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">CR</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">89.4908</td>
                                <td align="center" colspan="1" rowspan="1">89.8198</td>
                                <td align="center" colspan="1" rowspan="1">80.677</td>
                                <td align="center" colspan="1" rowspan="1">82.1913</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">CV</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">45.7033</td>
                                <td align="center" colspan="1" rowspan="1">35.6847</td>
                                <td align="center" colspan="1" rowspan="1">21.8658</td>
                                <td align="center" colspan="1" rowspan="1">132.1517</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">AR</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">91.7647</td>
                                <td align="center" colspan="1" rowspan="1">92.7206</td>
                                <td align="center" colspan="1" rowspan="1">97.5904</td>
                                <td align="center" colspan="1" rowspan="1">94.3775</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
                <table-wrap id="T6" orientation="portrait" position="anchor">
                    <label>Table 6. </label>
                    <caption>
                        <title>CCs selected from MC 
                            <italic toggle="yes">RdataI</italic>, 
                            <italic toggle="yes">MRdataI</italic>, 
                            <italic toggle="yes">RdataIII</italic> and 
                            <italic toggle="yes">MRdataIII</italic> PCA signals and evaluated with 
                            <italic toggle="yes">RdataI</italic>.</title>
                    </caption>
                    <table content-type="article-table" frame="hsides">
                        <thead>
                            <tr>
                                <th colspan="1" rowspan="1"/>
                                <th align="center" colspan="4" rowspan="1">
                                    <italic toggle="yes">vs RdataI</italic>
                                </th>
                            </tr>
                            <tr>
                                <th colspan="1" rowspan="1"/>
                                <th colspan="1" rowspan="1">
                                    <italic toggle="yes">RdataI</italic>
                                </th>
                                <th colspan="1" rowspan="1">
                                    <italic toggle="yes">MRdataI</italic>
                                </th>
                                <th colspan="1" rowspan="1">
                                    <italic toggle="yes">RdataIII</italic>
                                </th>
                                <th colspan="1" rowspan="1">
                                    <italic toggle="yes">MRdataIII</italic>
                                </th>
                            </tr>
                            <tr>
                                <th colspan="1" rowspan="1">
                                    <italic toggle="yes">K</italic>
                                </th>
                                <th align="center" colspan="4" rowspan="1">24</th>
                            </tr>
                        </thead>
                        <tbody>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">ANE</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">0.6148</td>
                                <td align="center" colspan="1" rowspan="1">0.6156</td>
                                <td align="center" colspan="1" rowspan="1">0.6251</td>
                                <td align="center" colspan="1" rowspan="1">0.6169</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">ENE</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">0.5989</td>
                                <td align="center" colspan="1" rowspan="1">0.6107</td>
                                <td align="center" colspan="1" rowspan="1">0.621</td>
                                <td align="center" colspan="1" rowspan="1">0.6194</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">E</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">0.6962</td>
                                <td align="center" colspan="1" rowspan="1">0.6909</td>
                                <td align="center" colspan="1" rowspan="1">0.6985</td>
                                <td align="center" colspan="1" rowspan="1">0.6934</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">MD</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">8.8542</td>
                                <td align="center" colspan="1" rowspan="1">8.5938</td>
                                <td align="center" colspan="1" rowspan="1">7.2917</td>
                                <td align="center" colspan="1" rowspan="1">6.7708</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">VT</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">52.0833</td>
                                <td align="center" colspan="1" rowspan="1">63.5417</td>
                                <td align="center" colspan="1" rowspan="1">52.0833</td>
                                <td align="center" colspan="1" rowspan="1">53.3854</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">CR</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">80.7367</td>
                                <td align="center" colspan="1" rowspan="1">83.768</td>
                                <td align="center" colspan="1" rowspan="1">81.7278</td>
                                <td align="center" colspan="1" rowspan="1">81.8623</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">CV</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">56.3949</td>
                                <td align="center" colspan="1" rowspan="1">59.6279</td>
                                <td align="center" colspan="1" rowspan="1">45.6875</td>
                                <td align="center" colspan="1" rowspan="1">199.9377</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">AR</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">86.5097</td>
                                <td align="center" colspan="1" rowspan="1">88.144</td>
                                <td align="center" colspan="1" rowspan="1">86.5651</td>
                                <td align="center" colspan="1" rowspan="1">90.7202</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
                <table-wrap id="T7" orientation="portrait" position="anchor">
                    <label>Table 7. </label>
                    <caption>
                        <title>CCs selected from MC 
                            <italic toggle="yes">RdataI</italic>, 
                            <italic toggle="yes">MRdataI</italic>, 
                            <italic toggle="yes">RdataIII</italic> and 
                            <italic toggle="yes">MRdataIII</italic> PCA signals and evaluated with 
                            <italic toggle="yes">RdataIII</italic>.</title>
                    </caption>
                    <table content-type="article-table" frame="hsides">
                        <thead>
                            <tr>
                                <th colspan="1" rowspan="1"/>
                                <th align="center" colspan="4" rowspan="1">
                                    <italic toggle="yes">vs RdataIII</italic>
                                </th>
                            </tr>
                            <tr>
                                <th colspan="1" rowspan="1"/>
                                <th colspan="1" rowspan="1">
                                    <italic toggle="yes">RdataI</italic>
                                </th>
                                <th colspan="1" rowspan="1">
                                    <italic toggle="yes">MRdataI</italic>
                                </th>
                                <th colspan="1" rowspan="1">
                                    <italic toggle="yes">RdataIII</italic>
                                </th>
                                <th colspan="1" rowspan="1">
                                    <italic toggle="yes">MRdataIII</italic>
                                </th>
                            </tr>
                            <tr>
                                <th colspan="1" rowspan="1">
                                    <italic toggle="yes">K</italic>
                                </th>
                                <th align="center" colspan="4" rowspan="1">24</th>
                            </tr>
                        </thead>
                        <tbody>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">ANE</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">0.6285</td>
                                <td align="center" colspan="1" rowspan="1">0.6276</td>
                                <td align="center" colspan="1" rowspan="1">0.6314</td>
                                <td align="center" colspan="1" rowspan="1">0.623</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">ENE</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">0.6273</td>
                                <td align="center" colspan="1" rowspan="1">0.6294</td>
                                <td align="center" colspan="1" rowspan="1">0.6368</td>
                                <td align="center" colspan="1" rowspan="1">0.6267</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">E</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">0.7036</td>
                                <td align="center" colspan="1" rowspan="1">0.7054</td>
                                <td align="center" colspan="1" rowspan="1">0.7226</td>
                                <td align="center" colspan="1" rowspan="1">0.7056</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">MD</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">8.0729</td>
                                <td align="center" colspan="1" rowspan="1">7.5521</td>
                                <td align="center" colspan="1" rowspan="1">7.2917</td>
                                <td align="center" colspan="1" rowspan="1">10.4167</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">VT</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">52.8646</td>
                                <td align="center" colspan="1" rowspan="1">60.6771</td>
                                <td align="center" colspan="1" rowspan="1">51.5625</td>
                                <td align="center" colspan="1" rowspan="1">46.875</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">CR</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">79.5995</td>
                                <td align="center" colspan="1" rowspan="1">81.0356</td>
                                <td align="center" colspan="1" rowspan="1">79.6809</td>
                                <td align="center" colspan="1" rowspan="1">84.53</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">CV</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">28.3673</td>
                                <td align="center" colspan="1" rowspan="1">56.3689</td>
                                <td align="center" colspan="1" rowspan="1">90.0475</td>
                                <td align="center" colspan="1" rowspan="1">60.7279</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">AR</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">88.9071</td>
                                <td align="center" colspan="1" rowspan="1">88.7705</td>
                                <td align="center" colspan="1" rowspan="1">87.5956</td>
                                <td align="center" colspan="1" rowspan="1">93.0471</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
                <table-wrap id="T8" orientation="portrait" position="anchor">
                    <label>Table 8. </label>
                    <caption>
                        <title>CCs selected from MC 
                            <italic toggle="yes">RdataII</italic>, 
                            <italic toggle="yes">MRdataI</italic> and 
                            <italic toggle="yes">MRdataIII</italic> PCA signals and evaluated with 
                            <italic toggle="yes">RdataII</italic>.</title>
                    </caption>
                    <table content-type="article-table" frame="hsides">
                        <thead>
                            <tr>
                                <th colspan="1" rowspan="1"/>
                                <th align="center" colspan="3" rowspan="1">
                                    <italic toggle="yes">vs RdataII</italic>
                                </th>
                            </tr>
                            <tr>
                                <th colspan="1" rowspan="1"/>
                                <th colspan="1" rowspan="1">
                                    <italic toggle="yes">RdataII</italic>
                                </th>
                                <th colspan="1" rowspan="1">
                                    <italic toggle="yes">MRdataI</italic>
                                </th>
                                <th colspan="1" rowspan="1">
                                    <italic toggle="yes">MRdataIII</italic>
                                </th>
                            </tr>
                            <tr>
                                <th colspan="1" rowspan="1">
                                    <italic toggle="yes">K</italic>
                                </th>
                                <th align="center" colspan="3" rowspan="1">24</th>
                            </tr>
                        </thead>
                        <tbody>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">ANE</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">0.4594</td>
                                <td align="center" colspan="1" rowspan="1">0.4652</td>
                                <td align="center" colspan="1" rowspan="1">0.4618</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">ENE</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">0.4796</td>
                                <td align="center" colspan="1" rowspan="1">0.4896</td>
                                <td align="center" colspan="1" rowspan="1">0.4742</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">E</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">0.6402</td>
                                <td align="center" colspan="1" rowspan="1">0.6205</td>
                                <td align="center" colspan="1" rowspan="1">0.6169</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">MD</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">0</td>
                                <td align="center" colspan="1" rowspan="1">5.2632</td>
                                <td align="center" colspan="1" rowspan="1">0</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">VT</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">39.4737</td>
                                <td align="center" colspan="1" rowspan="1">42.1053</td>
                                <td align="center" colspan="1" rowspan="1">60.5263</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">CR</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">63.8082</td>
                                <td align="center" colspan="1" rowspan="1">61.8988</td>
                                <td align="center" colspan="1" rowspan="1">68.2437</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">CV</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">3.8262</td>
                                <td align="center" colspan="1" rowspan="1">2.2285</td>
                                <td align="center" colspan="1" rowspan="1">4.1332</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1">
                                    <italic toggle="yes">AR</italic>
                                </td>
                                <td align="center" colspan="1" rowspan="1">95.4268</td>
                                <td align="center" colspan="1" rowspan="1">98.7805</td>
                                <td align="center" colspan="1" rowspan="1">98.7805</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
                <fig fig-type="figure" id="f6" orientation="portrait" position="float">
                    <label>Figure 6. </label>
                    <caption>
                        <p>First two principal components&#x2019; distributions of 
                            <italic toggle="yes">k</italic>=24 CC (orange) selected by 
                            <italic toggle="yes">PCA</italic> from 
                            <italic toggle="yes">FdataI</italic> (
                            <italic toggle="yes">a</italic>) and 
                            <italic toggle="yes">MDataI</italic> (
                            <italic toggle="yes">b</italic>) in 
                            <italic toggle="yes">FdataI</italic> distribution (blue).</p>
                    </caption>
                    <graphic orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/6857/ae10c947-df55-41ba-8b6b-8759d1e5d579_figure6.gif"/>
                </fig>
                <fig fig-type="figure" id="f7" orientation="portrait" position="float">
                    <label>Figure 7. </label>
                    <caption>
                        <p>First two principal components&#x2019; distributions of 
                            <italic toggle="yes">k</italic>=24 CC (orange) selected by 
                            <italic toggle="yes">PCA</italic> from 
                            <italic toggle="yes">FdataII</italic> (
                            <italic toggle="yes">a</italic>) and 
                            <italic toggle="yes">MDataI</italic> (
                            <italic toggle="yes">b</italic>) in 
                            <italic toggle="yes">FdataII</italic> distribution (blue).</p>
                    </caption>
                    <graphic orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/6857/ae10c947-df55-41ba-8b6b-8759d1e5d579_figure7.gif"/>
                </fig>
                <fig fig-type="figure" id="f8" orientation="portrait" position="float">
                    <label>Figure 8. </label>
                    <caption>
                        <p>First two principal components&#x2019; distributions of 
                            <italic toggle="yes">k</italic>=24 CC (orange) selected by 
                            <italic toggle="yes">PCA</italic> from 
                            <italic toggle="yes">RdataIII</italic> (
                            <italic toggle="yes">a</italic>) and 
                            <italic toggle="yes">MDataIII</italic> (
                            <italic toggle="yes">b</italic>) in 
                            <italic toggle="yes">RdataI</italic> distribution (blue).</p>
                    </caption>
                    <graphic orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/6857/ae10c947-df55-41ba-8b6b-8759d1e5d579_figure8.gif"/>
                </fig>
                <fig fig-type="figure" id="f9" orientation="portrait" position="float">
                    <label>Figure 9. </label>
                    <caption>
                        <p>First two principal components&#x2019; distributions of 
                            <italic toggle="yes">k</italic>=24 CC (orange) selected by 
                            <italic toggle="yes">PCA</italic> from 
                            <italic toggle="yes">RdataII</italic> (
                            <italic toggle="yes">a</italic>) and 
                            <italic toggle="yes">MRdataI</italic> (
                            <italic toggle="yes">b</italic>) in 
                            <italic toggle="yes">RdataII</italic> distribution (blue).</p>
                    </caption>
                    <graphic orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/6857/ae10c947-df55-41ba-8b6b-8759d1e5d579_figure9.gif"/>
                </fig>
                <p>These comprehensive CCs showed better overall scores than genotypic-only CCs when compared with genotypic-only data. In contrast, phenotypic-only CCs scored better overall than comprehensive CCs when compared against phenotypic-only data. In the latter case, it should be kept in mind that comprehensive data also include genotypic data; this could explain why better selections are made when only phenotypic data are considered, because genotypic variation may reduce the impact of some phenotypic traits in the PCA.</p>
                <p>The generation of a DM based on signal comparisons originating from mixed data construction enables us to explore one of the most interesting applications of this algorithm. By mapping genotypic and AT data, it is possible to construct a single signal from all the data available for a particular accession. The possibility of including genotypic data together with phenotypic traits, geographical locations, climates, habitats, nutritional requirements, symbiotic relationships and so forth provides an opportunity to determine the best information to include in the selection process in order to meet the particular objectives for which that CC is being selected. This concept, in addition to adequate scoring systems, may prove useful in designing tailored CCs that comply with specific research/breeding objectives.</p>
            </sec>
        </sec>
        <sec sec-type="conclusions">
            <title>Conclusions</title>
            <p>The use of SPTs in CC selection, as presented in this algorithm, enables us to analyse all available data comprehensively and from different perspectives. Despite its limitations, this signal construction makes it possible to analyse all available data regarding each accession in CC selection with good results. The efficiency of SPTs in CC selection suggests that the use of these tools in MC analysis may provide useful information not only for CC selection but also for other purposes. The implementation of current and other SPTs in all-inclusive MC-mapped signals is worth further exploration, and we believe that it will be an important asset to genetic resource management and exploitation.</p>
        </sec>
    </body>
    <back>
        <ack>
            <title>Acknowledgements</title>
            <p>We would like to thank F1000Research for the free-submission prize awarded at ISCB-ASIA 2014.</p>
        </ack>
        <sec id="SM1">
            <title>Supplementary Material 1</title>
            <p>
					
                <bold>Genomic and AT numerical mapping equivalences and Original Codes</bold>
            </p>
            <list list-type="bullet">
                <list-item>
                    <p>
                        <ext-link ext-link-type="uri" xlink:href="https://f1000researchdata.s3.amazonaws.com/supplementary/6391/675681b2-b751-4c73-9cac-060c68eeaf25.csv">SyntheticData.csv</ext-link>: Synthetic data representing binary information.</p>
                </list-item>
                <list-item>
                    <p>
                        <ext-link ext-link-type="uri" xlink:href="https://f1000researchdata.s3.amazonaws.com/supplementary/6391/516191de-96c0-4865-86c4-4dd8390eea6d.csv">FoxtailATMap.csv</ext-link>: Mapped Foxtail AT where 1=&#x2018;presence&#x2019;; 0=&#x2018;absence&#x2019; (corresponds to 
                        <italic toggle="yes">FdataII</italic>).</p>
                </list-item>
                <list-item>
                    <p>
                        <ext-link ext-link-type="uri" xlink:href="https://f1000researchdata.s3.amazonaws.com/supplementary/6391/8f1d8ea7-0201-4b25-9b39-002a0a78d107.csv">FoxtailGenMap.csv</ext-link>: Mapped Foxtail Genotype where 1=&#x2018;presence&#x2019;; 0=&#x2018;absence&#x2019; (corresponds to 
                        <italic toggle="yes">FdataI</italic>).</p>
                </list-item>
                <list-item>
                    <p>
                        <ext-link ext-link-type="uri" xlink:href="https://f1000researchdata.s3.amazonaws.com/supplementary/6391/9a5f1fba-3aac-4e17-9139-4e85ff759477.csv">RiceATMap.csv</ext-link>: Mapped Rice AT where 1=&#x2018;presence&#x2019;; 0=&#x2018;absence&#x2019; (corresponds to 
                        <italic toggle="yes">RdataII</italic>).</p>
                </list-item>
                <list-item>
                    <p>
                        <ext-link ext-link-type="uri" xlink:href="https://f1000researchdata.s3.amazonaws.com/supplementary/6391/ce56ba68-4d79-4401-ae45-7f28bae8bedc.csv">RiceGenIMap.csv</ext-link>: Mapped Rice SNPs where 1="T"; 2="C"; 4="N"; 6="G" and 7="A" (corresponds to 
                        <italic toggle="yes">RdataI</italic>).</p>
                </list-item>
                <list-item>
                    <p>
                        <ext-link ext-link-type="uri" xlink:href="https://f1000researchdata.s3.amazonaws.com/supplementary/6391/bcbf58d4-be80-4643-b8de-1be64cf2b000.csv">RiceGenIIIMap.csv</ext-link>: Mapped Rice SNPs where 1="T"; 2="C"; 4="N"; 6="G" and 7="A" (corresponds to 
                        <italic toggle="yes">RdataIII</italic>).</p>
                </list-item>
            </list>
            <p>Codes are enclosed as scripts in FFTCoreCollCodes.rar, available online at 
                <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.5281/zenodo.16895">https://doi.org/10.5281/zenodo.16895</ext-link>. Refer to README.m for details.</p>
        </sec>
        <ref-list>
            <ref id="ref-1">
                <label>1</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Watanabe</surname>
                            <given-names>KN</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Iwanaga</surname>
                            <given-names>M</given-names>
                        </name>
					</person-group>:
                    <article-title>Plant Genetic Resources and its Global Contribution.</article-title>
                    <source>
						
                        <italic toggle="yes">Plant Biotechnol.</italic>
					</source>
                    <year>1999</year>;<volume>16</volume>(<issue>1</issue>):<fpage>7</fpage>&#x2013;<lpage>13</lpage>.
                    <ext-link ext-link-type="uri" xlink:href="http://www.bunken.org/jspcmb/journal/pb16_1/pb16_1_007.pdf">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref-2">
                <label>2</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Dulloo</surname>
                            <given-names>ME</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Hunter</surname>
                            <given-names>D</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Borelli</surname>
                            <given-names>T</given-names>
                        </name>
					</person-group>:
                    <article-title>
						
                        <italic toggle="yes">Ex situ</italic> and 
                        <italic toggle="yes">in situ</italic> conservation of agricultural biodiversity: major advances and research needs.</article-title>
                    <source>
						
                        <italic toggle="yes">Not Bot Horti Agrobot Cluj Napoca.</italic>
					</source>
                    <year>2010</year>;<volume>38</volume>(<issue>2</issue>):<fpage>123</fpage>&#x2013;<lpage>135</lpage>.
                    <ext-link ext-link-type="uri" xlink:href="http://www.notulaebotanicae.ro/index.php/nbha/article/view/4878">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref-3">
                <label>3</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Upadhyaya</surname>
                            <given-names>HD</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Gowda</surname>
                            <given-names>CLL</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Sastry</surname>
                            <given-names>D</given-names>
                        </name>
					</person-group>:
                    <article-title>Plant genetic resources management: collection, characterization, conservation and utilization.</article-title>
                    <source>
						
                        <italic toggle="yes">J SAT Agricultural Res.</italic>
					</source>
                    <year>2008</year>;<fpage>1</fpage>&#x2013;<lpage>16</lpage>.
                    <ext-link ext-link-type="uri" xlink:href="http://oar.icrisat.org/2744/">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref-4">
                <label>4</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Brown</surname>
                            <given-names>AHD</given-names>
                        </name>
					</person-group>:
                    <article-title>Core collections: a practical approach to genetic resources management.</article-title>
                    <source>
						
                        <italic toggle="yes">Genome.</italic>
					</source>
                    <year>1989</year>;<volume>31</volume>(<issue>2</issue>):<fpage>818</fpage>&#x2013;<lpage>824</lpage>.
                    <pub-id pub-id-type="doi">10.1139/g89-144</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-5">
                <label>5</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Guo</surname>
                            <given-names>Y</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Li</surname>
                            <given-names>Y</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Hong</surname>
                            <given-names>H</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>Establishment of the integrated applied core collection and its comparison with mini core collection in soybean (
                        <italic toggle="yes">Glycine max</italic>).</article-title>
                    <source>
						
                        <italic toggle="yes">The Crop Journal.</italic>
					</source>
                    <year>2014</year>;<volume>2</volume>(<issue>1</issue>):<fpage>38</fpage>&#x2013;<lpage>45</lpage>.
                    <pub-id pub-id-type="doi">10.1016/j.cj.2013.11.001</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-6">
                <label>6</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Studnicki</surname>
                            <given-names>M</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Madry</surname>
                            <given-names>W</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Schmidt</surname>
                            <given-names>J</given-names>
                        </name>
					</person-group>:
                    <article-title>Efficiency of Sampling Strategies to Establish a Representative in the Phenotypic-based Genetic Diversity Core Collection of Orchardgrass (
                        <italic toggle="yes">Dactylis glomerata</italic>).</article-title>
                    <source>
						
                        <italic toggle="yes">Czech J Genet Plant Breed.</italic>
					</source>
                    <year>2013</year>;<volume>49</volume>(<issue>1</issue>):<fpage>36</fpage>&#x2013;<lpage>47</lpage>.
                    <ext-link ext-link-type="uri" xlink:href="http://www.agriculturejournals.cz/publicFiles/84712.pdf">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref-7">
                <label>7</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Odong</surname>
                            <given-names>TL</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Jansen</surname>
                            <given-names>J</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>van Eeuwijk</surname>
                            <given-names>FA</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>Quality of core collections for effective utilisation of genetic resources review, discussion and interpretation.</article-title>
                    <source>
						
                        <italic toggle="yes">Theor Appl Genet.</italic>
					</source>
                    <year>2013</year>;<volume>126</volume>(<issue>2</issue>):<fpage>289</fpage>&#x2013;<lpage>305</lpage>.
                    <pub-id pub-id-type="pmid">22983567</pub-id>
                    <pub-id pub-id-type="doi">10.1007/s00122-012-1971-y</pub-id>
                    <pub-id pub-id-type="pmcid">3555244</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-8">
                <label>8</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Richards</surname>
                            <given-names>CM</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Volk</surname>
                            <given-names>GM</given-names>
                        </name>
					</person-group>:
                    <article-title>Selection of stratified core sets representing wild apple (
                        <italic toggle="yes">Malus sieversii</italic>).</article-title>
                    <source>
						
                        <italic toggle="yes">J Am Soc Hortic Sci.</italic>
					</source>
                    <year>2009</year>;<volume>134</volume>(<issue>2</issue>):<fpage>228</fpage>&#x2013;<lpage>235</lpage>.
                    <ext-link ext-link-type="uri" xlink:href="http://naldc.nal.usda.gov/naldc/download.xhtml?id=32625&amp;content=PDF">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref-9">
                <label>9</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Franco</surname>
                            <given-names>J</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Crossa</surname>
                            <given-names>J</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Warburton</surname>
                            <given-names>ML</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>Sampling Strategies for Conserving Maize Diversity When Forming Core Subsets Using Genetic Markers.</article-title>
                    <source>
						
                        <italic toggle="yes">Crop Sci.</italic>
					</source>
                    <year>2006</year>;<volume>46</volume>(<issue>2</issue>):<fpage>854</fpage>&#x2013;<lpage>864</lpage>.
                    <pub-id pub-id-type="doi">10.2135/cropsci2005.07-0201</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-10">
                <label>10</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Hu</surname>
                            <given-names>J</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Zhu</surname>
                            <given-names>J</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Xu</surname>
                            <given-names>HM</given-names>
                        </name>
					</person-group>:
                    <article-title>Methods of constructing core collections by stepwise clustering with three sampling strategies based on the genotypic values of crops.</article-title>
                    <source>
						
                        <italic toggle="yes">Theor Appl Genet.</italic>
					</source>
                    <year>2000</year>;<volume>101</volume>(<issue>1&#x2013;2</issue>):<fpage>264</fpage>&#x2013;<lpage>268</lpage>.
                    <pub-id pub-id-type="doi">10.1007/s001220051478</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-11">
                <label>11</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Wang</surname>
                            <given-names>JC</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Hu</surname>
                            <given-names>J</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Huang</surname>
                            <given-names>XX</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>Assessment of different genetic distances in constructing cotton core subset by genotypic values.</article-title>
                    <source>
						
                        <italic toggle="yes">J Zhejiang Univ Sci B.</italic>
					</source>
                    <year>2008</year>;<volume>9</volume>(<issue>5</issue>):<fpage>356</fpage>&#x2013;<lpage>62</lpage>.
                    <pub-id pub-id-type="pmid">18500774</pub-id>
                    <pub-id pub-id-type="doi">10.1631/jzus.B0710615</pub-id>
                    <pub-id pub-id-type="pmcid">2367373</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-12">
                <label>12</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Thachuk</surname>
                            <given-names>C</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Crossa</surname>
                            <given-names>J</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Franco</surname>
                            <given-names>J</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>Core Hunter: an algorithm for sampling genetic resources based on multiple genetic measures.</article-title>
                    <source>
						
                        <italic toggle="yes">BMC Bioinformatics.</italic>
					</source>
                    <year>2009</year>;<volume>10</volume>:<fpage>243</fpage>.
                    <pub-id pub-id-type="pmid">19660135</pub-id>
                    <pub-id pub-id-type="doi">10.1186/1471-2105-10-243</pub-id>
                    <pub-id pub-id-type="pmcid">2734557</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-13">
                <label>13</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>De Beukelaer</surname>
                            <given-names>H</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Sm&#x00fd;kal</surname>
                            <given-names>P</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Davenport</surname>
                            <given-names>GF</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>Core Hunter II: fast core subset selection based on multiple genetic diversity measures using Mixed Replica search.</article-title>
                    <source>
						
                        <italic toggle="yes">BMC Bioinformatics.</italic>
					</source>
                    <year>2012</year>;<volume>13</volume>:<fpage>312</fpage>.
                    <pub-id pub-id-type="pmid">23174036</pub-id>
                    <pub-id pub-id-type="doi">10.1186/1471-2105-13-312</pub-id>
                    <pub-id pub-id-type="pmcid">3554476</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-14">
                <label>14</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Jansen</surname>
                            <given-names>J</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>van Hintum</surname>
                            <given-names>T</given-names>
                        </name>
					</person-group>:
                    <article-title>Genetic distance sampling: a novel sampling method for obtaining core collections using genetic distances with an application to cultivated lettuce.</article-title>
                    <source>
						
                        <italic toggle="yes">Theor Appl Genet.</italic>
					</source>
                    <year>2007</year>;<volume>114</volume>(<issue>3</issue>):<fpage>421</fpage>&#x2013;<lpage>8</lpage>.
                    <pub-id pub-id-type="pmid">17180377</pub-id>
                    <pub-id pub-id-type="doi">10.1007/s00122-006-0433-9</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-15">
                <label>15</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Gouesnard</surname>
                            <given-names>B</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Bataillon</surname>
                            <given-names>TM</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Decoux</surname>
                            <given-names>G</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>MSTRAT: An algorithm for building germ plasm core collections by maximizing allelic or phenotypic richness.</article-title>
                    <source>
						
                        <italic toggle="yes">J Hered.</italic>
					</source>
                    <year>2001</year>;<volume>92</volume>(<issue>1</issue>):<fpage>93</fpage>&#x2013;<lpage>94</lpage>.
                    <pub-id pub-id-type="pmid">11336240</pub-id>
                    <pub-id pub-id-type="doi">10.1093/jhered/92.1.93</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-16">
                <label>16</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Franco</surname>
                            <given-names>J</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Crossa</surname>
                            <given-names>J</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Ribaut</surname>
                            <given-names>JM</given-names>
                        </name>
					</person-group>:
                    <article-title>A method for combining molecular markers and phenotypic attributes for classifying plant genotypes.</article-title>
                    <source>
						
                        <italic toggle="yes">Theor Appl Genet.</italic>
					</source>
                    <year>2001</year>;<volume>103</volume>(<issue>6&#x2013;7</issue>):<fpage>944</fpage>&#x2013;<lpage>952</lpage>.
                    <pub-id pub-id-type="doi">10.1007/s001220100641</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-17">
                <label>17</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Kwan</surname>
                            <given-names>HK</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Arniker</surname>
                            <given-names>SB</given-names>
                        </name>
					</person-group>:
                    <article-title>Numerical representation of DNA sequences.</article-title>
                    <source>In 
                        <italic toggle="yes">IEEE International Conference on Electro/Information Technology.</italic>
					</source>
                    <year>2009</year>;<fpage>307</fpage>&#x2013;<lpage>310</lpage>.
                    <pub-id pub-id-type="doi">10.1109/EIT.2009.5189632</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-18">
                <label>18</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Dossou-Aminon</surname>
                            <given-names>I</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Loko</surname>
                            <given-names>LY</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Adjatin</surname>
                            <given-names>A</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>Genetic divergence in Northern Benin Sorghum (
                        <italic toggle="yes">Sorghum bicolor</italic> L. Moench) landraces as revealed by agromorphological traits and selection of candidate genotypes.</article-title>
                    <source>
						
                        <italic toggle="yes">ScientificWorldJournal.</italic>
					</source>
                    <year>2015</year>;<volume>2015</volume>:<fpage>e916476</fpage>.
                    <pub-id pub-id-type="pmid">25729773</pub-id>
                    <pub-id pub-id-type="doi">10.1155/2015/916476</pub-id>
                    <pub-id pub-id-type="pmcid">4333270</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-19">
                <label>19</label>
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Stein</surname>
                            <given-names>EM</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Weiss</surname>
                            <given-names>G</given-names>
                        </name>
					</person-group>:
                    <article-title>The Fourier Transform.</article-title> In 
                    <italic toggle="yes">Introduction to Fourier analysis on Euclidean Spaces.</italic> Princeton University Press. <year>1971</year>.
                    <ext-link ext-link-type="uri" xlink:href="http://press.princeton.edu/titles/1978.html">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref-20">
                <label>20</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Cooley</surname>
                            <given-names>JW</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Tukey</surname>
                            <given-names>JW</given-names>
                        </name>
					</person-group>:
                    <article-title>An algorithm for the machine calculation of complex Fourier series.</article-title>
                    <source>
						
                        <italic toggle="yes">Math Comput.</italic>
					</source>
                    <year>1965</year>;<volume>19</volume>(<issue>90</issue>):<fpage>297</fpage>&#x2013;<lpage>301</lpage>.
                    <pub-id pub-id-type="doi">10.2307/2003354</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-21">
                <label>21</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Nagarajan</surname>
                            <given-names>N</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Keich</surname>
                            <given-names>U</given-names>
                        </name>
					</person-group>:
                    <article-title>FAST: Fourier transform based algorithms for significance testing of ungapped multiple alignments.</article-title>
                    <source>
						
                        <italic toggle="yes">Bioinformatics.</italic>
					</source>
                    <year>2008</year>;<volume>24</volume>(<issue>4</issue>):<fpage>577</fpage>&#x2013;<lpage>8</lpage>.
                    <pub-id pub-id-type="pmid">18180239</pub-id>
                    <pub-id pub-id-type="doi">10.1093/bioinformatics/btm594</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-22">
                <label>22</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Borrayo</surname>
                            <given-names>E</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Mendizabal-Ruiz</surname>
                            <given-names>EG</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>V&#x00e9;lez-P&#x00e9;rez</surname>
                            <given-names>H</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>Genomic signal processing methods for computation of alignment-free distances from DNA sequences.</article-title>
                    <source>
						
                        <italic toggle="yes">PLoS One.</italic>
					</source>
                    <year>2014</year>;<volume>9</volume>(<issue>11</issue>):<fpage>e110954</fpage>.
                    <pub-id pub-id-type="pmid">25393409</pub-id>
                    <pub-id pub-id-type="doi">10.1371/journal.pone.0110954</pub-id>
                    <pub-id pub-id-type="pmcid">4230918</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-23">
                <label>23</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Wang</surname>
                            <given-names>JC</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Hu</surname>
                            <given-names>J</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Xu</surname>
                            <given-names>HM</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>A strategy on constructing core collections by least distance stepwise sampling.</article-title>
                    <source>
						
                        <italic toggle="yes">Theor Appl Genet.</italic>
					</source>
                    <year>2007</year>;<volume>115</volume>(<issue>1</issue>):<fpage>1</fpage>&#x2013;<lpage>8</lpage>.
                    <pub-id pub-id-type="pmid">17404701</pub-id>
                    <pub-id pub-id-type="doi">10.1007/s00122-007-0533-1</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-24">
                <label>24</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Hirano</surname>
                            <given-names>R</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Naito</surname>
                            <given-names>K</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Fukunaga</surname>
                            <given-names>K</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>Genetic structure of landraces in foxtail millet (
                        <italic toggle="yes">Setaria italica</italic> (L.) P. Beauv.) revealed with transposon display and interpretation to crop evolution of foxtail millet.</article-title>
                    <source>
						
                        <italic toggle="yes">Genome.</italic>
					</source>
                    <year>2011</year>;<volume>54</volume>(<issue>6</issue>):<fpage>498</fpage>&#x2013;<lpage>506</lpage>.
                    <pub-id pub-id-type="pmid">21623678</pub-id>
                    <pub-id pub-id-type="doi">10.1139/g11-015</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-25">
                <label>25</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Odong</surname>
                            <given-names>TL</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>van Heerwaarden</surname>
                            <given-names>J</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Jansen</surname>
                            <given-names>J</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>Determination of genetic structure of germplasm collections: are traditional hierarchical clustering methods appropriate for molecular marker data?</article-title>
                    <source>
						
                        <italic toggle="yes">Theor Appl Genet.</italic>
					</source>
                    <year>2011</year>;<volume>123</volume>(<issue>2</issue>):<fpage>195</fpage>&#x2013;<lpage>205</lpage>.
                    <pub-id pub-id-type="pmid">21472410</pub-id>
                    <pub-id pub-id-type="doi">10.1007/s00122-011-1576-x</pub-id>
                    <pub-id pub-id-type="pmcid">3114091</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-26">
                <label>26</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Cericola</surname>
                            <given-names>F</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Portis</surname>
                            <given-names>E</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Toppino</surname>
                            <given-names>L</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>The population structure and diversity of eggplant from Asia and the Mediterranean Basin.</article-title>
                    <source>
						
                        <italic toggle="yes">PLoS One.</italic>
					</source>
                    <year>2013</year>;<volume>8</volume>(<issue>9</issue>):<fpage>e73702</fpage>.
                    <pub-id pub-id-type="pmid">24040032</pub-id>
                    <pub-id pub-id-type="doi">10.1371/journal.pone.0073702</pub-id>
                    <pub-id pub-id-type="pmcid">3765357</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-27">
                <label>27</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Mei</surname>
                            <given-names>Y</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Zhou</surname>
                            <given-names>J</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Xu</surname>
                            <given-names>H</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>Development of sea island cotton (<italic toggle="yes">Gossypium barbadense</italic> L.) core collection using genotypic values.</article-title>
                    <source>
						
                        <italic toggle="yes">Aust J Crop Sci.</italic>
					</source>
                    <year>2012</year>;<volume>6</volume>(<issue>4</issue>):<fpage>673</fpage>&#x2013;<lpage>680</lpage>.
                    <ext-link ext-link-type="uri" xlink:href="http://www.cropj.com/xu_6_4_2012_673_680.pdf">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref-28">
                <label>28</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Redelings</surname>
                            <given-names>BD</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Suchard</surname>
                            <given-names>MA</given-names>
                        </name>
					</person-group>:
                    <article-title>Joint Bayesian estimation of alignment and phylogeny.</article-title>
                    <source>
						
                        <italic toggle="yes">Syst Biol.</italic>
					</source>
                    <year>2005</year>;<volume>54</volume>(<issue>3</issue>):<fpage>401</fpage>&#x2013;<lpage>418</lpage>.
                    <pub-id pub-id-type="pmid">16012107</pub-id>
                    <pub-id pub-id-type="doi">10.1080/10635150590947041</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-29">
                <label>29</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Cristea</surname>
                            <given-names>PD</given-names>
                        </name>
					</person-group>:
                    <article-title>Conversion of nucleotides sequences into genomic signals.</article-title>
                    <source>
						
                        <italic toggle="yes">J Cell Mol Med.</italic>
					</source>
                    <year>2002</year>;<volume>6</volume>(<issue>2</issue>):<fpage>279</fpage>&#x2013;<lpage>303</lpage>.
                    <pub-id pub-id-type="pmid">12169214</pub-id>
                    <pub-id pub-id-type="doi">10.1111/j.1582-4934.2002.tb00196.x</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-30">
                <label>30</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Rosen</surname>
                            <given-names>GL</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Sokhansanj</surname>
                            <given-names>BA</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Polikar</surname>
                            <given-names>R</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>Signal processing for metagenomics: extracting information from the soup.</article-title>
                    <source>
						
                        <italic toggle="yes">Curr Genomics.</italic>
					</source>
                    <year>2009</year>;<volume>10</volume>(<issue>7</issue>):<fpage>493</fpage>&#x2013;<lpage>510</lpage>.
                    <pub-id pub-id-type="pmid">20436876</pub-id>
                    <pub-id pub-id-type="doi">10.2174/138920209789208255</pub-id>
                    <pub-id pub-id-type="pmcid">2808676</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-31">
                <label>31</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Wang</surname>
                            <given-names>L</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Schonfeld</surname>
                            <given-names>D</given-names>
                        </name>
					</person-group>:
                    <article-title>Mapping Equivalence for Symbolic Sequences: Theory and Applications.</article-title>
                    <source>
						
                        <italic toggle="yes">IEEE Trans Signal Process.</italic>
					</source>
                    <year>2009</year>;<volume>57</volume>(<issue>12</issue>):<fpage>4895</fpage>&#x2013;<lpage>4905</lpage>.
                    <pub-id pub-id-type="doi">10.1109/TSP.2009.2026544</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-32">
                <label>32</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Almeida</surname>
                            <given-names>JS</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Vinga</surname>
                            <given-names>S</given-names>
                        </name>
					</person-group>:
                    <article-title>Universal sequence map (USM) of arbitrary discrete sequences.</article-title>
                    <source>
						
                        <italic toggle="yes">BMC Bioinformatics.</italic>
					</source>
                    <year>2002</year>;<volume>3</volume>(<issue>1</issue>):<fpage>6</fpage>.
                    <pub-id pub-id-type="pmid">11895567</pub-id>
                    <pub-id pub-id-type="doi">10.1186/1471-2105-3-6</pub-id>
                    <pub-id pub-id-type="pmcid">90187</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-33">
                <label>33</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Akhtar</surname>
                            <given-names>M</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Epps</surname>
                            <given-names>J</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Ambikairajah</surname>
                            <given-names>E</given-names>
                        </name>
					</person-group>:
                    <article-title>Signal Processing in Sequence Analysis: Advances in Eukaryotic Gene Prediction.</article-title>
                    <source>
						
                        <italic toggle="yes">IEEE J Sel Top Signal Process.</italic>
					</source>
                    <year>2008</year>;<volume>2</volume>(<issue>3</issue>):<fpage>310</fpage>&#x2013;<lpage>321</lpage>.
                    <pub-id pub-id-type="doi">10.1109/JSTSP.2008.923854</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-34">
                <label>34</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Franco</surname>
                            <given-names>J</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Crossa</surname>
                            <given-names>J</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Taba</surname>
                            <given-names>S</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>A Sampling Strategy for Conserving Genetic Diversity when Forming Core Subsets.</article-title>
                    <source>
						
                        <italic toggle="yes">Crop Sci.</italic>
					</source>
                    <year>2005</year>;<volume>45</volume>(<issue>3</issue>):<fpage>1035</fpage>&#x2013;<lpage>1044</lpage>.
                    <pub-id pub-id-type="doi">10.2135/cropsci2004.0292</pub-id>
                </mixed-citation>
            </ref>
        </ref-list>
    </back>
</article>
