<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Plant Sci.</journal-id>
<journal-title>Frontiers in Plant Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Plant Sci.</abbrev-journal-title>
<issn pub-type="epub">1664-462X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpls.2017.01748</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Plant Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Genetic Variation and Population Structure of <italic>Oryza glaberrima</italic> and Development of a Mini-Core Collection Using DArTseq</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name><surname>Ndjiondjop</surname> <given-names>Marie-Noelle</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn001"><sup>&#x0002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/483779/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Semagn</surname> <given-names>Kassa</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/465276/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Gouda</surname> <given-names>Arnaud C.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/474291/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Kpeki</surname> <given-names>S&#x000E8;djro B.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/466539/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Dro Tia</surname> <given-names>Daniel</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Sow</surname> <given-names>Mounirou</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/466723/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Goungoulou</surname> <given-names>Alphonse</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/483556/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Sie</surname> <given-names>Moussa</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/476714/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Perrier</surname> <given-names>Xavier</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<xref ref-type="aff" rid="aff6"><sup>6</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/478348/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Ghesquiere</surname> <given-names>Alain</given-names></name>
<xref ref-type="aff" rid="aff7"><sup>7</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Warburton</surname> <given-names>Marilyn L.</given-names></name>
<xref ref-type="aff" rid="aff8"><sup>8</sup></xref>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Africa Rice Center (AfricaRice)</institution>, <addr-line>Bouake</addr-line>, <country>Cote d&#x00027;Ivoire</country></aff>
<aff id="aff2"><sup>2</sup><institution>Department of Agriculture, Forestry and Nutrition Science, University of Alberta</institution>, <addr-line>Edmonton</addr-line>, <country>Canada</country></aff>
<aff id="aff3"><sup>3</sup><institution>Africa Rice Center (AfricaRice)</institution>, <addr-line>Ibadan</addr-line>, <country>Nigeria</country></aff>
<aff id="aff4"><sup>4</sup><institution>Africa Rice Center (AfricaRice), Centre National de la Recherche Appliqu&#x000E9;e au D&#x000E9;veloppement Rural (FOFIFA)</institution>, <addr-line>Antananarivo</addr-line>, <country>Madagascar</country></aff>
<aff id="aff5"><sup>5</sup><institution>Unit&#x000E9; Mixte de Recherche Am&#x000E9;lioration G&#x000E9;n&#x000E9;tique, CIRAD</institution>, <addr-line>Montpellier</addr-line>, <country>France</country></aff>
<aff id="aff6"><sup>6</sup><institution>University of Montpellier</institution>, <addr-line>Montpellier</addr-line>, <country>France</country></aff>
<aff id="aff7"><sup>7</sup><institution>Plant Diversity Adaptation and Development Research Unit, Institut de Recherche pour le D&#x000E9;veloppement - Universit&#x000E9; de Montpellier</institution>, <addr-line>Montpellier</addr-line>, <country>France</country></aff>
<aff id="aff8"><sup>8</sup><institution>Corn Host Plant Resistance Research Unit, United States Department of Agriculture, Agricultural Research Service</institution>, <addr-line>Starkville, Mississippi</addr-line>, <country>United States</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Petr Sm&#x000FD;kal, Palack&#x000FD; University, Czechia</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Christopher M. Richards, National Laboratory for Genetic Resource Preservation (ARS-USDA), United States; Hamid Khazaei, University of Saskatchewan, Canada</p></fn>
<fn fn-type="corresp" id="fn001"><p>&#x0002A;Correspondence: Marie-Noelle Ndjiondjop <email>m.ndjiondjop&#x00040;cgiar.org</email></p></fn>
<fn fn-type="other" id="fn002"><p>This article was submitted to Crop Science and Horticulture, a section of the journal Frontiers in Plant Science</p></fn></author-notes>
<pub-date pub-type="epub">
<day>17</day>
<month>10</month>
<year>2017</year>
</pub-date>
<pub-date pub-type="collection">
<year>2017</year>
</pub-date>
<volume>8</volume>
<elocation-id>1748</elocation-id>
<history>
<date date-type="received">
<day>08</day>
<month>08</month>
<year>2017</year>
</date>
<date date-type="accepted">
<day>25</day>
<month>09</month>
<year>2017</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x000A9; 2017 Ndjiondjop, Semagn, Gouda, Kpeki, Dro Tia, Sow, Goungoulou, Sie, Perrier, Ghesquiere and Warburton.</copyright-statement>
<copyright-year>2017</copyright-year>
<copyright-holder>Ndjiondjop, Semagn, Gouda, Kpeki, Dro Tia, Sow, Goungoulou, Sie, Perrier, Ghesquiere and Warburton</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) or licensor are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract><p>The sequence variation present in accessions conserved in genebanks can best be used in plant improvement when it is properly characterized and published. Using low cost and high density single nucleotide polymorphism (SNP) assays, the genetic diversity, population structure, and relatedness between pairs of accessions can be quickly assessed. This information is relevant for different purposes, including creating core and mini-core sets that represent the maximum possible genetic variation contained in the whole collection. Here, we studied the genetic variation and population structure of 2,179 <italic>Oryza glaberrima</italic> Steud. accessions conserved at the AfricaRice genebank using 27,560 DArTseq-based SNPs. Only 14% (3,834 of 27,560) of the SNPs were polymorphic across the 2,179 accessions, which is much lower than diversity reported in other <italic>Oryza</italic> species. Genetic distance between pairs of accessions varied from 0.005 to 0.306, with 1.5% of the pairs nearly identical, 8.0% of the pairs similar, 78.1% of the pairs moderately distant, and 12.4% of the pairs very distant. The number of redundant accessions that contribute little or no new genetic variation to the <italic>O. glaberrima</italic> collection was very low. Using the maximum length sub-tree method, we propose a subset of 1,330 and 350 accessions to represent a core and mini-core collection, respectively. The core and mini-core sets accounted for &#x0007E;61 and 16%, respectively, of the whole collection, and captured 97&#x02013;99% of the SNP polymorphism and nearly all allele and genotype frequencies observed in the whole <italic>O. glaberrima</italic> collection available at the AfricaRice genebank. Cluster, principal component and model-based population structure analyses all divided the 2,179 accessions into five groups, based roughly on country of origin but less so on ecology. The first, third and fourth groups consisted of accessions primarily from Liberia, Nigeria, and Mali, respectively; the second group consisted primarily of accessions from Togo and Nigeria; and the fifth and smallest group was a mixture of accessions from multiple countries. Analysis of molecular variance showed between 10.8 and 28.9% of the variation among groups with the remaining 71.1&#x02013;89.2% attributable to differences within groups.</p></abstract>
<kwd-group>
<kwd>African rice</kwd>
<kwd>plant genetic resources</kwd>
<kwd><italic>O. glaberrima</italic></kwd>
<kwd>core collection</kwd>
<kwd>genetic differentiation</kwd>
<kwd>genetic diversity</kwd>
<kwd>SNP</kwd>
</kwd-group>
<counts>
<fig-count count="7"/>
<table-count count="5"/>
<equation-count count="0"/>
<ref-count count="88"/>
<page-count count="19"/>
<word-count count="12692"/>
</counts>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1">
<title>Introduction</title>
<p>The ability of individuals, populations or species to adapt to changing environments is directly dependent on the amount of genetic variation (diversity) they possess (Frankham, <xref ref-type="bibr" rid="B26">2005</xref>). In general, higher genetic diversity provides greater ability to adapt to changes in environmental conditions, while lower genetic diversity results in uniformity and reduces adaptability (Luan et al., <xref ref-type="bibr" rid="B43">2006</xref>), which in turn increases the chance for extinction. Furthermore, plant breeders need sequence variation in breeding populations to accelerate gain from selection to improve yield, resistance to biotic and abiotic stresses, and other traits. Some of this genetic variation is present in genebank accessions, and may be used if properly cataloged; this may include finding specific new traits, or selection of parental combinations for developing progeny with maximum genetic variability for further selection (Barrett and Kidwell, <xref ref-type="bibr" rid="B5">1998</xref>). Knowledge of genetic diversity and population structure is also useful for essential genebank tasks, including creating core and mini-core sets that represent the variation available in the whole collection, in a more manageable sample size (Yan et al., <xref ref-type="bibr" rid="B85">2007</xref>; Agrama et al., <xref ref-type="bibr" rid="B1">2009</xref>; El Bakkali et al., <xref ref-type="bibr" rid="B20">2013</xref>); establishing benchmark data to serve as a baseline for estimating possible loss of genetic diversity during conservation (Reif et al., <xref ref-type="bibr" rid="B62">2005</xref>); estimating the relative strengths of the evolutionary forces of genetic drift, natural selection, mutation, and gene flow on populations <italic>ex situ</italic> or <italic>in situ</italic> (Falconer and MacKay, <xref ref-type="bibr" rid="B25">1996</xref>; Ouborg et al., <xref ref-type="bibr" rid="B56">1999</xref>); and identifying gaps in genebank collections (Brown, <xref ref-type="bibr" rid="B9">1989</xref>).</p>
<p>Genebanks aim to conserve germplasm that represent distinct combinations of genes and alleles that may confer adaptive potential for a wide range of economically important traits (McCouch et al., <xref ref-type="bibr" rid="B45">2012</xref>). In most cases, however, only a small fraction of germplasm conserved at genebanks has been characterized in detail due to (i) technical and financial constraints in conducting detailed phenotypic evaluation of large germplasm collections in multiple environments; and (ii) lack of low cost, high-throughput, and high density molecular marker assays. In such cases, the development of core and mini-core sets would speed detailed phenotypic evaluation of target traits of interest under field or controlled conditions to provide information essential for breeding and gene discovery (Agrama et al., <xref ref-type="bibr" rid="B1">2009</xref>; Tiwari et al., <xref ref-type="bibr" rid="B78">2015</xref>). Different types of molecular markers have been used to characterize the genetic diversity and population structure of germplasm conserved in genebanks (Semagn et al., <xref ref-type="bibr" rid="B69">2006</xref>; Sharma, <xref ref-type="bibr" rid="B73">2017</xref>), but single nucleotide polymorphism (SNP) assays are popular due to their abundance, locus-specificity, low error rates, co-dominant inheritance, and potential for high throughput analysis (Rafalski, <xref ref-type="bibr" rid="B61">2002</xref>; Schlotterer, <xref ref-type="bibr" rid="B66">2004</xref>). SNP data can be obtained using numerous uniplex or multiplex genotyping platforms (Syvanen, <xref ref-type="bibr" rid="B75">2001</xref>; Chen and Sullivan, <xref ref-type="bibr" rid="B12">2003</xref>), but most are expensive for high density genotyping of large numbers of genebank accessions.</p>
<p>The recent development of next-generation sequencing based genotyping technologies, such as genotyping by sequencing (GBS) (Elshire et al., <xref ref-type="bibr" rid="B21">2011</xref>) and the diversity arrays technology-based sequencing (DArTseq) platform (Sansaloni et al., <xref ref-type="bibr" rid="B65">2011</xref>) generate high density SNP information with significantly reduced genotyping cost, allowing detailed molecular characterization of germplasm conserved in genebanks. While GBS has become a popular SNP genotyping method that generates up to a million SNPs per sample (Elshire et al., <xref ref-type="bibr" rid="B21">2011</xref>; Crossa et al., <xref ref-type="bibr" rid="B15">2013</xref>; Ertiro et al., <xref ref-type="bibr" rid="B22">2015</xref>), the technology has some limitations, including a relatively large proportion of missing data points (Beissinger et al., <xref ref-type="bibr" rid="B6">2013</xref>; Nazzicari et al., <xref ref-type="bibr" rid="B52">2016</xref>), and high allele calling error-rates due to low read coverage and when genotyping heterogeneous and highly heterozygous germplasm (Semagn et al., <xref ref-type="bibr" rid="B68">2015</xref>). Some of these drawbacks have been dealt with through intensive post data correction, including implementation of reliable imputation methods, re-analyzing/re-examining old data using improved computational tools, and increasing read coverage (Semagn et al., <xref ref-type="bibr" rid="B68">2015</xref>; Furuta et al., <xref ref-type="bibr" rid="B27">2017</xref>). DArTseq has been used as an alternative to GBS; while it generates lower density SNP information (ranging from a few thousand to 350,000 SNPs depending on the species), it has relatively better coverage and lower levels of missing data (Chen et al., <xref ref-type="bibr" rid="B11">2016</xref>). The DArTseq assay has been used for studies of several species, including <italic>Oryza sativa</italic> spp. japonica (Courtois et al., <xref ref-type="bibr" rid="B14">2013</xref>), <italic>Zea mays</italic> L (Chen et al., <xref ref-type="bibr" rid="B11">2016</xref>; dos Santos et al., <xref ref-type="bibr" rid="B17">2016</xref>), <italic>Triticum turgidum</italic> L. (Baloch et al., <xref ref-type="bibr" rid="B3">2017</xref>), 16 taxonomic units of the genus <italic>Secale</italic> (Al-Beyroutiov&#x000E1; et al., <xref ref-type="bibr" rid="B2">2016</xref>), <italic>Citrullus lanatus</italic> (Thunb.) Matsum. and Nakai (Ren et al., <xref ref-type="bibr" rid="B63">2015</xref>; Yang et al., <xref ref-type="bibr" rid="B87">2016</xref>), and 13 genotypes from the genus <italic>Ananas</italic> that represent from primitive wild accessions to modern cultivars (Kilian et al., <xref ref-type="bibr" rid="B35">2016</xref>), among others.</p>
<p>Rice is the second largest crop in total global production after maize (<ext-link ext-link-type="uri" xlink:href="http://www.fao.org/faostat/en/#data">http://www.fao.org/faostat/en/#data</ext-link>; accessed in Sept. 2017) and feeds more people than any other crop (Maclean et al., <xref ref-type="bibr" rid="B44">2002</xref>). It belongs to the genus <italic>Oryza</italic>, which consists of several wild and two cultivated species - the African rice (<italic>O. glaberrima</italic> Steud.) and the Asian rice (<italic>O. sativa</italic> L.). Although the International Rice Research Institute (IRRI) genebank in the Philippines conserves the largest collection of rice germplasm, the Africa Rice Center (AfricaRice) genebank also conserves approximately 22,000 registered rice samples that represent five African indigenous wild species (<italic>O. barthii, O. longistaminata, O. eichingery, O. punctate</italic>, and <italic>O. branchyata</italic>), as well as both modern and traditional <italic>O. glaberrima</italic> and <italic>O. sativa</italic> varieties. <italic>O. glaberrima</italic> accounts for approximately 14% of the collection at the AfricaRice genebank. Efforts have been made to characterize the <italic>O. glaberrima</italic> germplasm conserved at the AfricaRice genebank using phenotypic traits (Montcho et al., <xref ref-type="bibr" rid="B49">2013</xref>; Mokuwa et al., <xref ref-type="bibr" rid="B48">2014</xref>), molecular markers (Joshi et al., <xref ref-type="bibr" rid="B34">2000</xref>; Ishii et al., <xref ref-type="bibr" rid="B32">2001</xref>; Park et al., <xref ref-type="bibr" rid="B57">2003</xref>; Semon et al., <xref ref-type="bibr" rid="B72">2005</xref>; Kwon et al., <xref ref-type="bibr" rid="B37">2006</xref>; Dram&#x000E9; et al., <xref ref-type="bibr" rid="B16">2011</xref>; Mokuwa et al., <xref ref-type="bibr" rid="B48">2014</xref>; Orjuela et al., <xref ref-type="bibr" rid="B55">2014</xref>; Meyer et al., <xref ref-type="bibr" rid="B47">2016</xref>), and DNA sequencing (Li et al., <xref ref-type="bibr" rid="B40">2011</xref>; Wang et al., <xref ref-type="bibr" rid="B80">2014</xref>). However, most of the previous genetic characterization studies were done on small numbers of accessions using few phenotypic traits and/or molecular markers. To improve characterization of the collection, the AfricaRice genebank used DArTseq to determine the genetic variation and population structure of the entire rice collection conserved in its genebank. This information is being used to create core and mini-core sets of germplasm representing the entire gene pool of each <italic>Oryza</italic> species conserved in the genebank; and to develop quality control genotyping methods to track seed identity, genetic purity, and minimize human error, including stray pollen contamination during regeneration, undesired mixing of seed lots, and labeling/handling errors. The objectives of the present study were to use the DArTseq data to (i) investigate the genetic variation, relatedness and population structure of <italic>O. glaberrima</italic> collection available at the AfricaRice genebank and (ii) create core and mini-core sets of accessions that capture most of the genetic variation of the whole <italic>O. glaberrima</italic> collection conserved at the AfricaRice genebank. This will aid breeders to efficiently tap the available sequence diversity of the collection to create improved cultivars.</p>
</sec>
<sec sec-type="materials and methods" id="s2">
<title>Materials and methods</title>
<sec>
<title>Plant materials and phenotyping</title>
<p>A total of 2,223 cultivated <italic>O. glaberrima</italic> accessions conserved at the AfricaRice (previously called the West Africa Rice Development Association, WARDA), genebank was initially used in this study (Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S1</xref>). The accessions originated from 23 countries, with each country represented from one accession each from the Democratic Republic of Congo and Burundi to 575 accessions from Nigeria. Between 1973 and 1989, AfricaRice received germplasm collections for several <italic>Oryza</italic> species from the Office de la Recherche Scientifique et Technique d&#x00027;Outre-Mer (ORSTOM) in France, Institute de Recherche d&#x00027;Afrique Tropicale (IRAT) in France, the International Institute for Tropical Agriculture (IITA) in Nigeria, the Central Agricultural Research Institute (CARI) in Liberia, and the Kogoshima University in Liberia. Additional collections were made by AfricaRice scientists and collaborators to fill collection gaps of the different <italic>Oryza</italic> species growing across floating, mangrove, swamp, hydromorphic, irrigated lowland, rainfed lowland, and upland growing ecologies in Africa. Nearly 92% of the 2,223 accessions used in the present study originate from eight countries, which includes Nigeria (25.9%), Liberia (23.5%), Mali (12.2%), Togo (10.3%), Guinea Conakry (6.8), C&#x000F4;te d&#x00027;Ivoire (Ivory Coast) (4.9%), Senegal (4.8%) and Burkina Faso (3.3%) (Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S1</xref>). AfricaRice was created in the early 1970s in Monrovia, Liberia. Because of the civil disturbances in Liberia, however, AfricaRice moved its headquarter from Liberia to the Ivory Coast in 1987/1988. During the civil disturbance and relocation period, part of the passport data was lost, which forced the AfricaRice genebank staff to register several accessions with missing passport data either to Liberia (the former AfricaRice head office) or Nigeria where many rice collections were received from IITA, which may have contributed to the larger proportion of accessions originated from both Liberia and Nigeria as compared with all other countries.</p>
<p>To update the phenotypic descriptors of the whole <italic>O. glaberrima</italic> collection by growing them in the same environmental conditions, we evaluated each accession in a three-row plot of 0.4 m wide &#x000D7; 1.0 m long under sprinkler irrigation at the AfricaRice experimental field in Cotonou, Benin (6&#x000B0; 25&#x02032; N latitude and at 2&#x000B0; 20&#x02032; E longitude). Seeds were directly sown in the field with a spacing of 0.20 m between rows and 1 m between accessions in August 2016 using randomized incomplete block design with a single replication; standard agronomic practices and inputs were used. For each accession, seven phenotypic traits were recorded on 5 randomly selected plants from the inner row of each plot using the Standard Evaluation System for Rice (<ext-link ext-link-type="uri" xlink:href="http://www.knowledgebank.irri.org/ses/SES.htm">http://www.knowledgebank.irri.org/ses/SES.htm</ext-link>; accessed in Sept. 2017). Days to heading was recorded as the number of days from seeding until 50% of the panicles had headed. Total number of tillers per plant was counted at maximum tillering, while number of fertile tillers per plant were counted at maturity when about 50% of the panicles in a plot lost their greenness. Plant height was measured from the base of the plants to the tip of heads, excluding awns, at maturity. Panicle length was measured from the panicle neck to the panicle tip, excluding awns, at maturity.</p>
</sec>
<sec>
<title>DNA extraction and genotyping</title>
<p>Genomic DNA was extracted from a single plant per accession from screenhouse grown 3-weeks old seedling in 2016 using the cetyltrimethyl ammonium bromide (CTAB) method (Murray and Thompson, <xref ref-type="bibr" rid="B51">1980</xref>), with minor modifications. DNA concentration was measured using a SmartSpec Plus spectrophotometer (Bio-Rad, USA) as described in the user&#x00027;s manual, and normalized to 100 ng/&#x003BC;L. DNA samples were shipped to DArT Pty Ltd, Canberra, Australia and genotyped in 96-plex using the DArTseq<sup>TM</sup> technology (Sansaloni et al., <xref ref-type="bibr" rid="B65">2011</xref>; Ren et al., <xref ref-type="bibr" rid="B63">2015</xref>). The detailed methodology on complexity reduction, cloning, library construction and cleaning are described in a recent paper (Egea et al., <xref ref-type="bibr" rid="B19">2017</xref>). Amplification fragments were sequenced on the Illumina Hiseq 2500 (<ext-link ext-link-type="uri" xlink:href="http://www.illumina.com">www.illumina.com</ext-link>) and SNPs were called using the DArTsoft analytical pipeline (<ext-link ext-link-type="uri" xlink:href="http://www.diversityarrays.com/dart-technology-package-dartSoft">http://www.diversityarrays.com/dart-technology-package-dartSoft</ext-link>). A total of 31,739 SNPs were successfully called, of which approximately 18% of the SNPs had missing data points ranging from 0 to 79.7%, with an overall average missing data points of 11% (data not shown). The missing alleles of SNPs with &#x0003C;50% missing data points (Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S1</xref>, Supplementary Figure <xref ref-type="supplementary-material" rid="SM5">S1a</xref>) were imputed by DArT Pty Ltd as described in another study (Swarts et al., <xref ref-type="bibr" rid="B74">2014</xref>). A total of 27,560 imputed SNPs (Table <xref ref-type="table" rid="T1">1</xref>) were then received from DArT Pty Ltd that were polymorphic across 5 <italic>Oryza</italic> species sampled from the AfricaRice genebank, each SNP with a minor allele frequency of &#x0003E; 0.01.</p>
<table-wrap position="float" id="T1">
<label>Table 1</label>
<caption><p>The chromosomal distribution of 3,834 polymorphic SNPs used for genotyping 2,179 <italic>O. glaberrima</italic> accessions, including the physical length of each chromosome covered by the SNPs (in kilobase pairs) and the average distance between SNPs.</p></caption>
<table frame="hsides" rules="groups">
<thead><tr>
<th valign="top" align="left"><bold>Chromosomes</bold></th>
<th valign="top" align="center"><bold>Physical length based on 27,560 SNPs (kb)</bold></th>
<th valign="top" align="center"><bold>Initial number of polymorphic SNPs used for genotyping</bold></th>
<th valign="top" align="center"><bold>Number of SNPs polymorphic in 2,179 <italic>O. glaberrima</italic></bold></th>
<th valign="top" align="center"><bold>Average map length per SNP (kb)</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Chr1</td>
<td valign="top" align="center">43,230</td>
<td valign="top" align="center">2,731</td>
<td valign="top" align="center">308</td>
<td valign="top" align="center">140</td>
</tr>
<tr>
<td valign="top" align="left">Chr2</td>
<td valign="top" align="center">35,885</td>
<td valign="top" align="center">2,446</td>
<td valign="top" align="center">285</td>
<td valign="top" align="center">126</td>
</tr>
<tr>
<td valign="top" align="left">Chr3</td>
<td valign="top" align="center">36,413</td>
<td valign="top" align="center">2,318</td>
<td valign="top" align="center">257</td>
<td valign="top" align="center">142</td>
</tr>
<tr>
<td valign="top" align="left">Chr4</td>
<td valign="top" align="center">35,498</td>
<td valign="top" align="center">2,062</td>
<td valign="top" align="center">239</td>
<td valign="top" align="center">149</td>
</tr>
<tr>
<td valign="top" align="left">Chr5</td>
<td valign="top" align="center">29,763</td>
<td valign="top" align="center">1,681</td>
<td valign="top" align="center">214</td>
<td valign="top" align="center">139</td>
</tr>
<tr>
<td valign="top" align="left">Chr6</td>
<td valign="top" align="center">31,191</td>
<td valign="top" align="center">1,866</td>
<td valign="top" align="center">235</td>
<td valign="top" align="center">133</td>
</tr>
<tr>
<td valign="top" align="left">Chr7</td>
<td valign="top" align="center">29,679</td>
<td valign="top" align="center">1,780</td>
<td valign="top" align="center">228</td>
<td valign="top" align="center">130</td>
</tr>
<tr>
<td valign="top" align="left">Chr8</td>
<td valign="top" align="center">28,429</td>
<td valign="top" align="center">1,654</td>
<td valign="top" align="center">149</td>
<td valign="top" align="center">191</td>
</tr>
<tr>
<td valign="top" align="left">Chr9</td>
<td valign="top" align="center">22,947</td>
<td valign="top" align="center">1,375</td>
<td valign="top" align="center">158</td>
<td valign="top" align="center">145</td>
</tr>
<tr>
<td valign="top" align="left">Chr10</td>
<td valign="top" align="center">23,205</td>
<td valign="top" align="center">1,444</td>
<td valign="top" align="center">224</td>
<td valign="top" align="center">104</td>
</tr>
<tr>
<td valign="top" align="left">Chr11</td>
<td valign="top" align="center">29,000</td>
<td valign="top" align="center">1,839</td>
<td valign="top" align="center">317</td>
<td valign="top" align="center">91</td>
</tr>
<tr>
<td valign="top" align="left">Chr12</td>
<td valign="top" align="center">27,505</td>
<td valign="top" align="center">1,719</td>
<td valign="top" align="center">233</td>
<td valign="top" align="center">118</td>
</tr>
<tr style="border-bottom: thin solid #000000;">
<td valign="top" align="left">Unmapped</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">4,645</td>
<td valign="top" align="center">987</td>
<td valign="top" align="center">&#x02013;</td>
</tr> <tr>
<td valign="top" align="left">Total</td>
<td valign="top" align="center">372,746</td>
<td valign="top" align="center">27,560</td>
<td valign="top" align="center">3,834</td>
<td/>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec>
<title>Statistical analyses</title>
<p>For each SNP, polymorphism information content (PIC) values were computed using PowerMarker v.3.25 (Liu and Muse, <xref ref-type="bibr" rid="B41">2005</xref>). The proportion of observed heterozygosity in each accession was calculated using TASSEL v.5.2.37 (Bradbury et al., <xref ref-type="bibr" rid="B8">2007</xref>). A genetic distance matrix was calculated between each pair of accessions using the identity-by-state (IBS) method implemented in TASSEL v.5.2.37. Cluster analysis was performed on the genetic distance matrix using the neighbor-joining algorithm implemented in molecular evolutionary genetics analysis (MEGA) v.6.0 (Tamura et al., <xref ref-type="bibr" rid="B76">2013</xref>) and the Dissimilarity Analysis and Representation for windows (DARwin) v.6.0.14 (Perrier et al., <xref ref-type="bibr" rid="B58">2003</xref>). Population structure was evaluated using the model-based method implemented in the software package STRUCTURE v.2.3.4 (Pritchard et al., <xref ref-type="bibr" rid="B60">2000</xref>). STRUCTURE was run by varying the number of clusters (K) from 1 to 10 as described elsewhere (Semagn et al., <xref ref-type="bibr" rid="B71">2012b</xref>, <xref ref-type="bibr" rid="B70">2014</xref>); each K was repeated three times with a burn-in period of 10,000 and 10,000 MCMC (Markov Chain Monte Carlo) replications after burn-in. For each <italic>K</italic>-value, genotypes with probability of membership &#x0003E;60% were assigned to the same group, while those with &#x0003C;60% probability in any group were assigned to a &#x0201C;mixed&#x0201D; group (Yang et al., <xref ref-type="bibr" rid="B86">2011</xref>; Semagn et al., <xref ref-type="bibr" rid="B71">2012b</xref>). Principal component analysis (PCA) was performed using TASSEL v.5.2.37. The first two principal components from the PCA were plotted for visual examination in XLSTAT 2012 (Addinsof, New York, USA; <ext-link ext-link-type="uri" xlink:href="http://www.xlstat.com">www.xlstat.com</ext-link>) using the scatter plot option with the following categorical variables: countries of origin and ecologies of accessions, and group memberships obtained from cluster analysis and the model-based STRUCTURE.</p>
<p>The extent of polymorphism, heterozygosity, nucleotide diversity, and F<sub>ST</sub>-based pairwise genetic distance matrices (Holsinger and Weir, <xref ref-type="bibr" rid="B30">2009</xref>) were computed among categorical variables using ARLEQUIN v.3.5.2.2 (Excoffier and Lischer, <xref ref-type="bibr" rid="B23">2010</xref>). <italic>F</italic><sub><italic>ST</italic></sub> values are indicative of the evolutionary processes that influence the structure of genetic variation among populations or groups, with &#x0003C;0.05 indicating little, 0.05&#x02013;0.15 moderate, 0.15&#x02013;0.25 great, and &#x0003E; 0.25 very great genetic differentiation (Wright, <xref ref-type="bibr" rid="B83">1978</xref>). Analysis of molecular variance (AMOVA) (Excoffier et al., <xref ref-type="bibr" rid="B24">1992</xref>) was also computed using ARLEQUIN v.3.5.2.2 to partition the variation among and within groups of accessions belonging to the different categorical variables listed above.</p>
<p>The maximum (core) and minimum (mini-core) number of <italic>O. glaberrima</italic> accessions required to capture the majority of alleles and genetic diversity observed in the whole <italic>O. glaberrima</italic> collection were found using the maximum length sub-tree (MLST) method implemented in DARwin v.6.0.14. Sphericity index (the ratio of the lengths of external edges to the total length of the sub tree) was used in deciding the most informative number of genotypes to be retained or removed. In the presence of redundant genotypes, the sphericity index curve would be linear (in a plateau) with the initial value obtained before any genotype is removed, which is indicative of the number of redundant genotypes to be removed. The curve increases as each redundancy is removed until it reaches another plateau, at which point the minimum number of genotypes that can be retained while conserving maximum diversity has been reached (Perrier et al., <xref ref-type="bibr" rid="B58">2003</xref>). The phenotypic traits were summarized using MiniTab v14.</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>Results</title>
<sec>
<title>Initial analyses and marker polymorphism</title>
<p>Of the 27,560 SNPs (Table <xref ref-type="table" rid="T1">1</xref>) that were polymorphic across 5 <italic>Oryza</italic> species, nearly 60% (16,532 SNPs) were polymorphic across the 2,223 <italic>O. glaberrima</italic> accessions. Minor allele frequency in the <italic>O. glaberrima</italic> data set ranged from 0.010 to 0.498 (Supplementary Figure <xref ref-type="supplementary-material" rid="SM5">S1c</xref>). Approximately 46% of the polymorphisms (12,698 out of the 27,560 SNPs) were found in only 44 accessions originated from 11 countries (see list of accessions at the end of Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S1</xref>) that showed extremely different haplotypes as compared with all other <italic>O. glaberrima</italic> accessions. Genetic distance between pairs of the 2,223 accessions computed from the 16,532 polymorphic SNPs varied from 0.002 to 0.841, with an overall average of 0.058. The majority (87.4%) of the pairs of accessions had a genetic distance of &#x0003C; 0.05, which is extremely small as compared with just 2.7% of the pairs of accessions that had genetic distance &#x0003E; 0.300 (Figure <xref ref-type="fig" rid="F1">1</xref>). A neighbor-joining tree generated from the genetic distance matrix of the 16,532 SNPs revealed radical separation of the 44 accessions from all others (Supplementary Figure <xref ref-type="supplementary-material" rid="SM5">S2</xref>). Because of this distance, and the possibility that these accessions may be natural introgressions from other <italic>Oryza</italic> species, or have been misclassified, they were excluded from further analysis. Following exclusion, only 3,834 SNPs (13.9%) were polymorphic among the remaining 2,179 accessions (Table <xref ref-type="table" rid="T2">2</xref>), each with minor allele frequency ranging from 0.010 to 0.498 (Supplementary Figure <xref ref-type="supplementary-material" rid="SM5">S1c</xref>). Polymorphism information content of each of the 3,834 SNP was fairly low, varying from 0.020 to 0.375 (Supplementary Figure <xref ref-type="supplementary-material" rid="SM5">S3</xref>). Approximately 74% of the 3,834 polymorphic SNPs were mapped onto one of the 12 rice chromosomes, and the remaining 26% were unmapped (Table <xref ref-type="table" rid="T1">1</xref>). The number of mapped SNPs varied from 149 on chromosome 8 to 317 on chromosome 11, with an overall average of 237 SNPs per chromosome. The physical length of each chromosome varied from 22,947 kb on chromosome 9 to 43,230 kb on chromosome 1 (Table <xref ref-type="table" rid="T1">1</xref>, Supplementary Figure <xref ref-type="supplementary-material" rid="SM5">S4</xref>) and the overall genome size was 372.7 Mb.</p>
<fig id="F1" position="float">
<label>Figure 1</label>
<caption><p>Frequency distribution categories of pairwise genetic distance of 2,223 <italic>O. glaberrima</italic> accessions based on 16, 532 SNPs (black fill); 2,179 accessions (after excluding the 44 most diverse accessions) based on 3,834 SNPs (orange brick fill); a core set of 1,330 accessions (blue diagonal line fill) based on 3,781 polymorphic SNPs, and a mini-core set of 350 accessions (green dashed line fill), based on 3,709 polymorphic SNPs.</p></caption>
<graphic xlink:href="fpls-08-01748-g0001.tif"/>
</fig>
<table-wrap position="float" id="T2">
<label>Table 2</label>
<caption><p>Summary of the 2,179 <italic>O. glaberrima</italic> accessions used in the present study and the number of accessions selected to represent a core and mini-core sets.</p></caption>
<table frame="hsides" rules="groups">
<thead><tr>
<th valign="top" align="left"><bold>Country of origin</bold></th>
<th valign="top" align="center"><bold>Final number of accessions used</bold></th>
<th valign="top" align="center"><bold>No. of accessions retained in the core set</bold></th>
<th valign="top" align="center"><bold>No. of accessions retained in the mini-core set</bold></th>
<th valign="top" align="center" colspan="6" style="border-bottom: thin solid #000000;"><bold>No. of accessions belonging to each group based on STRUCTURE at <italic>K</italic> &#x0003D; 5</bold></th>
<th valign="top" align="center" colspan="5" style="border-bottom: thin solid #000000;"><bold>No. of accessions belonging to each group based on cluster analysis</bold></th>
</tr>
<tr>
<th/>
<th/>
<th/>
<th/>
<th valign="top" align="center"><bold>Group 1</bold></th>
<th valign="top" align="center"><bold>Group 2</bold></th>
<th valign="top" align="center"><bold>Group 3</bold></th>
<th valign="top" align="center"><bold>Group 4</bold></th>
<th valign="top" align="center"><bold>Group 5</bold></th>
<th valign="top" align="center"><bold>Admixture</bold></th>
<th valign="top" align="center"><bold>Group 1</bold></th>
<th valign="top" align="center"><bold>Group 2</bold></th>
<th valign="top" align="center"><bold>Group 3</bold></th>
<th valign="top" align="center"><bold>Group 4</bold></th>
<th valign="top" align="center"><bold>Group 5</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Benin</td>
<td valign="top" align="center">3</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Burkina Faso</td>
<td valign="top" align="center">74</td>
<td valign="top" align="center">59</td>
<td valign="top" align="center">14</td>
<td valign="top" align="center">3</td>
<td valign="top" align="center">3</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">44</td>
<td valign="top" align="center">20</td>
<td valign="top" align="center">4</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">7</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">51</td>
<td valign="top" align="center">12</td>
</tr>
<tr>
<td valign="top" align="left">Burundi</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Cameroon</td>
<td valign="top" align="center">37</td>
<td valign="top" align="center">26</td>
<td valign="top" align="center">7</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">30</td>
<td valign="top" align="center">3</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">33</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">2</td>
</tr>
<tr>
<td valign="top" align="left">Chad</td>
<td valign="top" align="center">18</td>
<td valign="top" align="center">13</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">13</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">3</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">15</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">2</td>
</tr>
<tr>
<td valign="top" align="left">Congo</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">1</td>
</tr>
<tr>
<td valign="top" align="left">Egypt</td>
<td valign="top" align="center">3</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">1</td>
</tr>
<tr>
<td valign="top" align="left">Gambia</td>
<td valign="top" align="center">24</td>
<td valign="top" align="center">18</td>
<td valign="top" align="center">7</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">9</td>
<td valign="top" align="center">7</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">4</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">16</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">5</td>
</tr>
<tr>
<td valign="top" align="left">Ghana</td>
<td valign="top" align="center">37</td>
<td valign="top" align="center">29</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">23</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">4</td>
<td valign="top" align="center">7</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">26</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">7</td>
<td valign="top" align="center">2</td>
</tr>
<tr>
<td valign="top" align="left">Guinea Conakry</td>
<td valign="top" align="center">145</td>
<td valign="top" align="center">92</td>
<td valign="top" align="center">19</td>
<td valign="top" align="center">8</td>
<td valign="top" align="center">5</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">22</td>
<td valign="top" align="center">92</td>
<td valign="top" align="center">16</td>
<td valign="top" align="center">11</td>
<td valign="top" align="center">12</td>
<td valign="top" align="center">4</td>
<td valign="top" align="center">49</td>
<td valign="top" align="center">69</td>
</tr>
<tr>
<td valign="top" align="left">Guinea Bissau</td>
<td valign="top" align="center">14</td>
<td valign="top" align="center">12</td>
<td valign="top" align="center">3</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">11</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">11</td>
</tr>
<tr>
<td valign="top" align="left">Ivory Coast</td>
<td valign="top" align="center">104</td>
<td valign="top" align="center">67</td>
<td valign="top" align="center">15</td>
<td valign="top" align="center">10</td>
<td valign="top" align="center">13</td>
<td valign="top" align="center">5</td>
<td valign="top" align="center">27</td>
<td valign="top" align="center">45</td>
<td valign="top" align="center">4</td>
<td valign="top" align="center">10</td>
<td valign="top" align="center">40</td>
<td valign="top" align="center">8</td>
<td valign="top" align="center">29</td>
<td valign="top" align="center">17</td>
</tr>
<tr>
<td valign="top" align="left">Liberia</td>
<td valign="top" align="center">518</td>
<td valign="top" align="center">188</td>
<td valign="top" align="center">33</td>
<td valign="top" align="center">300</td>
<td valign="top" align="center">19</td>
<td valign="top" align="center">11</td>
<td valign="top" align="center">19</td>
<td valign="top" align="center">157</td>
<td valign="top" align="center">12</td>
<td valign="top" align="center">315</td>
<td valign="top" align="center">54</td>
<td valign="top" align="center">14</td>
<td valign="top" align="center">25</td>
<td valign="top" align="center">110</td>
</tr>
<tr>
<td valign="top" align="left">Madagascar</td>
<td valign="top" align="center">3</td>
<td valign="top" align="center">3</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Mali</td>
<td valign="top" align="center">267</td>
<td valign="top" align="center">218</td>
<td valign="top" align="center">76</td>
<td valign="top" align="center">14</td>
<td valign="top" align="center">14</td>
<td valign="top" align="center">6</td>
<td valign="top" align="center">211</td>
<td valign="top" align="center">15</td>
<td valign="top" align="center">7</td>
<td valign="top" align="center">13</td>
<td valign="top" align="center">18</td>
<td valign="top" align="center">6</td>
<td valign="top" align="center">218</td>
<td valign="top" align="center">12</td>
</tr>
<tr>
<td valign="top" align="left">Niger</td>
<td valign="top" align="center">6</td>
<td valign="top" align="center">6</td>
<td valign="top" align="center">3</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">3</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">4</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Nigeria</td>
<td valign="top" align="center">563</td>
<td valign="top" align="center">410</td>
<td valign="top" align="center">136</td>
<td valign="top" align="center">30</td>
<td valign="top" align="center">191</td>
<td valign="top" align="center">232</td>
<td valign="top" align="center">16</td>
<td valign="top" align="center">47</td>
<td valign="top" align="center">47</td>
<td valign="top" align="center">31</td>
<td valign="top" align="center">230</td>
<td valign="top" align="center">251</td>
<td valign="top" align="center">23</td>
<td valign="top" align="center">28</td>
</tr>
<tr>
<td valign="top" align="left">Senegal</td>
<td valign="top" align="center">99</td>
<td valign="top" align="center">76</td>
<td valign="top" align="center">20</td>
<td valign="top" align="center">10</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">5</td>
<td valign="top" align="center">7</td>
<td valign="top" align="center">67</td>
<td valign="top" align="center">9</td>
<td valign="top" align="center">10</td>
<td valign="top" align="center">12</td>
<td valign="top" align="center">6</td>
<td valign="top" align="center">11</td>
<td valign="top" align="center">60</td>
</tr>
<tr>
<td valign="top" align="left">Sierra Leone</td>
<td valign="top" align="center">7</td>
<td valign="top" align="center">3</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">4</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">3</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">3</td>
</tr>
<tr>
<td valign="top" align="left">Tanzania</td>
<td valign="top" align="center">4</td>
<td valign="top" align="center">4</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">1</td>
</tr>
<tr>
<td valign="top" align="left">Togo</td>
<td valign="top" align="center">226</td>
<td valign="top" align="center">86</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">4</td>
<td valign="top" align="center">210</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">9</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">4</td>
<td valign="top" align="center">214</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">6</td>
</tr>
<tr>
<td valign="top" align="left">Zambia</td>
<td valign="top" align="center">4</td>
<td valign="top" align="center">4</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">3</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">3</td>
<td valign="top" align="center">&#x02013;</td>
</tr>
<tr>
<td valign="top" align="left">Zimbabwe</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">&#x02013;</td>
<td valign="top" align="center">1</td>
</tr>
<tr style="border-bottom: thin solid #000000;">
<td valign="top" align="left">Others</td>
<td valign="top" align="center">19</td>
<td valign="top" align="center">11</td>
<td valign="top" align="center">4</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">3</td>
<td valign="top" align="center">6</td>
<td valign="top" align="center">6</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">8</td>
<td valign="top" align="center">5</td>
</tr> <tr>
<td valign="top" align="left">Total</td>
<td valign="top" align="center">2,179</td>
<td valign="top" align="center">1,330</td>
<td valign="top" align="center">350</td>
<td valign="top" align="center">387</td>
<td valign="top" align="center">536</td>
<td valign="top" align="center">283</td>
<td valign="top" align="center">374</td>
<td valign="top" align="center">493</td>
<td valign="top" align="center">106</td>
<td valign="top" align="center">404</td>
<td valign="top" align="center">686</td>
<td valign="top" align="center">303</td>
<td valign="top" align="center">438</td>
<td valign="top" align="center">348</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec>
<title>Genetic purity, distance, and relationships</title>
<p>Observed heterozygosity per accession ranged from 0 to 19.3% (Supplementary Figure <xref ref-type="supplementary-material" rid="SM5">S5</xref>), with an overall average of 0.8%. Only 114 accessions (5.2% of the 2,179 accessions) had observed heterozygosity &#x0003E; 3.1% (Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S1</xref>). Genetic distance between pair of the 2,179 accessions ranged from 0.005 to 0.306 (Supplementary Table <xref ref-type="supplementary-material" rid="SM2">S2</xref>), and the overall average distance was 0.153. As shown in Figure <xref ref-type="fig" rid="F1">1</xref> and Supplementary Table <xref ref-type="supplementary-material" rid="SM2">S2</xref>, the majority (78.1%) of the pairs of accessions had a genetic distance value that fell between 0.10 and 0.20 as compared to the 9.5 and 12.5% that fellow below 0.10 and greater than 0.20, respectively.</p>
<p>The neighbor-joining cluster analysis performed on the genetic distance matrix grouped the 2,179 accessions into five groups (Figure <xref ref-type="fig" rid="F2">2A</xref>, Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S1</xref>). The groups clustered somewhat according to geography and country of origin. The first group consisted of 404 accessions originating from 12 countries, but the vast majority (77.9%) was from Liberia. The second group consisted of 686 accessions from 18 countries, but most accessions (65%) were from Nigeria (33.5%) and Togo (31.2%). The third group consisted of 303 accessions originating from 16 countries, of which 82.8% were from Nigeria. Group four had a total of 438 accessions from 17 countries, but Mali accounted for half (49.8%), followed by smaller contributions of over 5% from five other countries: Burkina Faso (11.6%), Guinea Conakry (11.2%), Ivory Coast (6.6%), Liberia (5.7%), and Nigeria (5.3%). The fifth group had 348 accessions from 18 countries and there was no clear majority from any single country; however, 92% of the accessions originated from 8 of 18 countries: Liberia (31.6%), Guinea Conakry (19.8%), Senegal (17.2%), Nigeria (8.0%), Ivory Coast (4.9%), Mali (3.4%), Burkina Faso (3.4%), and Guinea Bissau (3.2%) (Figure <xref ref-type="fig" rid="F2">2B</xref>, Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S1</xref>). The clustering of accessions to the five groups also showed a pattern by ecology, although less clearly so (Figure <xref ref-type="fig" rid="F2">2C</xref>). The first group consisted of approximately 74% of the accessions from the rainfed lowland ecology; the second group was primarily a mixture of irrigated lowland and upland; the third group mostly rainfed and irrigated lowland; the fourth group mostly irrigated lowland, and the fifth group again a more balanced mixture of all ecologies (but more irrigated lowland than others).</p>
<fig id="F2" position="float">
<label>Figure 2</label>
<caption><p><bold>(A)</bold> Neighbor-joining tree of 2,179 <italic>Oryza glaberrima</italic> accessions based on 3,834 polymorphic SNPs (G1 &#x0003D; Group 1, red font; G2 &#x0003D; Group 2, pink font; G3&#x0003D; Group 3, blue font; G4 &#x0003D; Group 4, black font; G5 &#x0003D; Group 5, aqua font); <bold>(B)</bold> summary of accessions in each group by country of origin (only countries with &#x0003E;40 accessions were listed here); <bold>(C)</bold> summary of accessions belonging to each group by ecology. See Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S1</xref> for detail group membership.</p></caption>
<graphic xlink:href="fpls-08-01748-g0002.tif"/>
</fig>
</sec>
<sec>
<title>Population structure</title>
<p>We explored population structure in the <italic>O. glaberrima</italic> germplasm conserved at the AfricaRice genebank using the model-based population structure. The log probability of the data (LnP(D)) increased between <italic>K</italic> &#x0003D; 1 and <italic>K</italic> &#x0003D; 5, and mostly reached a plateau between <italic>K</italic> &#x0003D; 5 and <italic>K</italic> &#x0003D; 10, while the ad hoc statistic &#x00394;K declined between <italic>K</italic> &#x0003D; 2 and <italic>K</italic> &#x0003D; 5 (Figure <xref ref-type="fig" rid="F3">3</xref>), which suggest the presence of up to five possible groups in the germplasm. To decide the most likely number of groups that exist in the <italic>O. glaberrima</italic> collection, we used the group memberships from STRUCTURE in plotting the first two principal components from PCA analysis. A plot of PC1 (14.6% of the variation) and PC2 (5.8%) revealed 5 groups (Figure <xref ref-type="fig" rid="F4">4</xref>) with the same pattern of groupings as the model-based population partition at <italic>K</italic> &#x0003D; 5. Nearly all individuals assigned to a group at <italic>K</italic> &#x0003D; 5 belong to the same group in the principal component analysis, with the mixed group being intermediate between the second and third groups (Figure <xref ref-type="fig" rid="F4">4B</xref>). The proportion of accessions assigned to the five groups predicted from STRUCTURE varied from 13.0% in group 3 to 24.6% in group 2 (Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S1</xref>). Group membership obtained from STRUCTURE agreed with that of cluster analysis for 1,868 accessions (85.7%); the remaining 311 accessions (14.3%) differed in their group membership between cluster analysis and STRUCTURE. Of these, 106 accessions were assigned in to a mixed group in STRUCTURE. The other 205 accessions grouped into different STRUCTURE groups than would have been predicted by cluster analysis, including accessions that belong to the STRUCTURE G1 (8 accessions), G2 (3 accessions), G3 (32 accessions), G4 (7 accessions) and G5 (155 accessions) (Supplemental Table <xref ref-type="supplementary-material" rid="SM1">S1</xref>). Excluding accessions that were assigned in to a mixed group, nearly 76% of the accessions that showed discrepancy between the cluster analysis and STRUCTURE came from group 5. The fifth group consisted of 493 accessions from 18 countries of which 89.9% were from seven countries&#x02014;Liberia (31.8%), Guinea Conakry (18.7%), Senegal (13.6%), Nigeria (9.5%), Ivory Coast (4.1%), and Burkina Faso (3.0%) (Figure <xref ref-type="fig" rid="F3">3</xref>, Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S1</xref>).</p>
<fig id="F3" position="float">
<label>Figure 3</label>
<caption><p>Population structure of 2,179 accessions based on 3,834 polymorphic SNPs: <bold>(A)</bold> plot of LnP(D) and an ad hoc statistic &#x00394;K calculated for K ranging from 1 to 10, with each K repeated thrice; <bold>(B)</bold> population structure at <italic>K</italic> &#x0003D; 5, with each accession represented by a single vertical line that is partitioned into K colored segments, with lengths proportional to the estimated probability membership value (y-axis); <bold>(C)</bold> frequency distribution of accessions belonging to each predicted group by country of origin, with all countries that had &#x0003C;40 accessions combined in to &#x0201C;others&#x0201D;; <bold>(D)</bold> frequency distribution of accessions belong to each predicted group by ecology, with &#x0201C;others&#x00027; referring to accessions from floating, mangrove, deep and shallow forest swamp, and hydromorphic ecologies. See Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S1</xref> for details.</p></caption>
<graphic xlink:href="fpls-08-01748-g0003.tif"/>
</fig>
<fig id="F4" position="float">
<label>Figure 4</label>
<caption><p>Plots of PC1 (14.6% of variation) and PC2 (5.8%) from principal component analyses of 2,179 <italic>O. glaberrima</italic> accessions genotyped with 3,834 polymorphic SNPs. The plots are based on group membership from <bold>(A)</bold> cluster analysis, <bold>(B)</bold> STRUCTURE at <italic>K</italic> &#x0003D; 5, <bold>(C)</bold> country of origin, and <bold>(D)</bold> ecology. All countries with &#x0003C; 40 accessions were combined to &#x0201C;others.&#x0201D; In the ecology plot, &#x0201C;others&#x0201D; refers to accessions from floating, mangrove, deep and shallow forest swamp, and hydromorphic ecologies, each with smaller number of accessions. See Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S1</xref> for details.</p></caption>
<graphic xlink:href="fpls-08-01748-g0004.tif"/>
</fig>
</sec>
<sec>
<title>Molecular diversity and genetic differentiation</title>
<p>Table <xref ref-type="table" rid="T3">3</xref> shows a summary of the percent polymorphism, observed heterozygosity, gene diversity, and nucleotide diversity among accessions belonging to the same categorical variables (country, ecology and predicted group membership based on cluster analysis and the model-based STRUCTURE). Of the 3,834 SNPs that were polymorphic across all 2,179 <italic>O. glaberrima</italic> accessions, the lowest (44.3%) and highest (97.8%) polymorphism was observed within accessions originating from Chad and Nigeria, respectively, which may be due mainly to the size of samples from each country. Nucleotide diversity varied from 0.055 for accessions originated from Togo to 0.161 for those from Mali. When polymorphism and nucleotide diversity among ecology groups were compared, polymorphism was the lowest in mangrove (52.8%) and highest in irrigated lowland (100%), while nucleotide diversity was the lowest in upland (0.118) and the highest (0.160) in lowland irrigated/rainfed ecologies. Accessions that belong to the first group predicted based on cluster analysis and the model-based STRUCTURE analysis showed the least polymorphism (71.2&#x02013;73.9%), while those accessions in the third group had the highest gene and nucleotide diversity (Table <xref ref-type="table" rid="T3">3</xref>).</p>
<table-wrap position="float" id="T3">
<label>Table 3</label>
<caption><p>Summary of polymorphism and molecular diversity among accessions belonging to different hierarchical levels (country and ecology of origin of accessions plus predicted groups based on the model-based STRUCTURE at <italic>K</italic> &#x0003D; 5 and cluster analysis).</p></caption>
<table frame="hsides" rules="groups">
<thead><tr>
<th valign="top" align="left"><bold>Category</bold></th>
<th valign="top" align="left"><bold>Description</bold></th>
<th valign="top" align="left"><bold>No. of accessions</bold></th>
<th valign="top" align="center"><bold>Polymorphism (%)</bold></th>
<th valign="top" align="center"><bold>Average observed heterozygosity (Std.)</bold></th>
<th valign="top" align="center"><bold>Gene diversity (Std.)</bold></th>
<th valign="top" align="center"><bold>Average nucleotide diversity (Std.)</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left" colspan="7" style="background-color:#bbbdc0"><bold>COUNTRY OF ORIGIN</bold></td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Burkina Faso</td>
<td valign="top" align="left">74</td>
<td valign="top" align="center">79.6</td>
<td valign="top" align="center">0.012 (0.038)</td>
<td valign="top" align="center">0.165 (0.156)</td>
<td valign="top" align="center">0.131 (0.062)</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Cameroon</td>
<td valign="top" align="left">37</td>
<td valign="top" align="center">67.0</td>
<td valign="top" align="center">0.021 (0.049)</td>
<td valign="top" align="center">0.175 (0.155)</td>
<td valign="top" align="center">0.117 (0.056)</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Chad</td>
<td valign="top" align="left">18</td>
<td valign="top" align="center">44.3</td>
<td valign="top" align="center">0.017 (0.057)</td>
<td valign="top" align="center">0.269 (0.151)</td>
<td valign="top" align="center">0.119 (0.058)</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Gambia</td>
<td valign="top" align="left">24</td>
<td valign="top" align="center">59.4</td>
<td valign="top" align="center">0.019 (0.049)</td>
<td valign="top" align="center">0.237 (0.164)</td>
<td valign="top" align="center">0.141 (0.068)</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Ghana</td>
<td valign="top" align="left">37</td>
<td valign="top" align="center">68.3</td>
<td valign="top" align="center">0.014 (0.040)</td>
<td valign="top" align="center">0.161 (0.132)</td>
<td valign="top" align="center">0.110 (0.053)</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Guinea Conakry</td>
<td valign="top" align="left">145</td>
<td valign="top" align="center">89.5</td>
<td valign="top" align="center">0.008 (0.030)</td>
<td valign="top" align="center">0.135 (0.138)</td>
<td valign="top" align="center">0.121 (0.057)</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Guinea Bissau</td>
<td valign="top" align="left">14</td>
<td valign="top" align="center">52.0</td>
<td valign="top" align="center">0.008 (0.042)</td>
<td valign="top" align="center">0.248 (0.135)</td>
<td valign="top" align="center">0.129 (0.063)</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Ivory Coast</td>
<td valign="top" align="left">104</td>
<td valign="top" align="center">93.0</td>
<td valign="top" align="center">0.008 (0.031)</td>
<td valign="top" align="center">0.150 (0.125)</td>
<td valign="top" align="center">0.139 (0.066)</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Liberia</td>
<td valign="top" align="left">518</td>
<td valign="top" align="center">97.7</td>
<td valign="top" align="center">0.010 (0.034)</td>
<td valign="top" align="center">0.117 (0.148)</td>
<td valign="top" align="center">0.114 (0.054)</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Mali</td>
<td valign="top" align="left">267</td>
<td valign="top" align="center">96.1</td>
<td valign="top" align="center">0.007 (0.031)</td>
<td valign="top" align="center">0.167 (0.154)</td>
<td valign="top" align="center">0.161 (0.076)</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Nigeria</td>
<td valign="top" align="left">563</td>
<td valign="top" align="center">97.8</td>
<td valign="top" align="center">0.008 (0.030)</td>
<td valign="top" align="center">0.161 (0.143)</td>
<td valign="top" align="center">0.157 (0.074)</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Senegal</td>
<td valign="top" align="left">99</td>
<td valign="top" align="center">86.4</td>
<td valign="top" align="center">0.013 (0.033)</td>
<td valign="top" align="center">0.136 (0.133)</td>
<td valign="top" align="center">0.117 (0.055)</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Togo</td>
<td valign="top" align="left">226</td>
<td valign="top" align="center">73.4</td>
<td valign="top" align="center">0.006 (0.034)</td>
<td valign="top" align="center">0.075 (0.126)</td>
<td valign="top" align="center">0.055 (0.026)</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Others</td>
<td valign="top" align="left">53</td>
<td valign="top" align="center">90.1</td>
<td valign="top" align="center">0.007 (0.030)</td>
<td valign="top" align="center">0.180 (0.125)</td>
<td valign="top" align="center">0.160 (0.077)</td>
</tr>
<tr>
<td valign="top" align="left" colspan="7" style="background-color:#bbbdc0"><bold>ECOLOGY OF ORIGIN</bold></td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Floating</td>
<td valign="top" align="left">55</td>
<td valign="top" align="center">82.4</td>
<td valign="top" align="center">0.009 (0.035)</td>
<td valign="top" align="center">0.187 (0.151)</td>
<td valign="top" align="center">0.154 (0.073)</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Hydromorphic</td>
<td valign="top" align="left">18</td>
<td valign="top" align="center">55.4</td>
<td valign="top" align="center">0.027 (0.054)</td>
<td valign="top" align="center">0.251 (0.146)</td>
<td valign="top" align="center">0.139 (0.067)</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Irrigated lowland</td>
<td valign="top" align="left">804</td>
<td valign="top" align="center">100.0</td>
<td valign="top" align="center">0.008 (0.028)</td>
<td valign="top" align="center">0.154 (0.120)</td>
<td valign="top" align="center">0.154 (0.073)</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Lowland irrigated/rainfed</td>
<td valign="top" align="left">353</td>
<td valign="top" align="center">97.9</td>
<td valign="top" align="center">0.010 (0.029)</td>
<td valign="top" align="center">0.164 (0.139)</td>
<td valign="top" align="center">0.160 (0.076)</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Mangrove</td>
<td valign="top" align="left">13</td>
<td valign="top" align="center">52.8</td>
<td valign="top" align="center">0.011 (0.044)</td>
<td valign="top" align="center">0.285 (0.133)</td>
<td valign="top" align="center">0.151 (0.074)</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Rainfed lowland</td>
<td valign="top" align="left">521</td>
<td valign="top" align="center">97.6</td>
<td valign="top" align="center">0.010 (0.033)</td>
<td valign="top" align="center">0.121 (0.146)</td>
<td valign="top" align="center">0.119 (0.056)</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Swamp</td>
<td valign="top" align="left">26</td>
<td valign="top" align="center">66.8</td>
<td valign="top" align="center">0.020 (0.043)</td>
<td valign="top" align="center">0.232 (0.131)</td>
<td valign="top" align="center">0.155 (0.074)</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Upland</td>
<td valign="top" align="left">389</td>
<td valign="top" align="center">99.6</td>
<td valign="top" align="center">0.006 (0.028)</td>
<td valign="top" align="center">0.118 (0.119)</td>
<td valign="top" align="center">0.118 (0.056)</td>
</tr>
<tr>
<td valign="top" align="left" colspan="7" style="background-color:#bbbdc0"><bold>GROUPS BASED ON CLUSTER ANALYSIS</bold></td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Group 1</td>
<td valign="top" align="left">404</td>
<td valign="top" align="center">71.2</td>
<td valign="top" align="center">0.013 (0.045)</td>
<td valign="top" align="center">0.129 (0.168)</td>
<td valign="top" align="center">0.092 (0.043)</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Group 2</td>
<td valign="top" align="left">686</td>
<td valign="top" align="center">93.8</td>
<td valign="top" align="center">0.009 (0.032)</td>
<td valign="top" align="center">0.114 (0.139)</td>
<td valign="top" align="center">0.107 (0.051)</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Group 3</td>
<td valign="top" align="left">303</td>
<td valign="top" align="center">84.3</td>
<td valign="top" align="center">0.012 (0.034)</td>
<td valign="top" align="center">0.189 (0.175)</td>
<td valign="top" align="center">0.159 (0.075)</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Group 4</td>
<td valign="top" align="left">438</td>
<td valign="top" align="center">92.6</td>
<td valign="top" align="center">0.008 (0.033)</td>
<td valign="top" align="center">0.167 (0.156)</td>
<td valign="top" align="center">0.155 (0.073)</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Group 5</td>
<td valign="top" align="left">348</td>
<td valign="top" align="center">72.2</td>
<td valign="top" align="center">0.007 (0.032)</td>
<td valign="top" align="center">0.122 (0.146)</td>
<td valign="top" align="center">0.088 (0.042)</td>
</tr>
<tr>
<td valign="top" align="left" colspan="7" style="background-color:#bbbdc0"><bold>GROUPS BASED ON STRUCTURE AT <italic>K</italic> &#x0003D; 5</bold></td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Group 1</td>
<td valign="top" align="left">387</td>
<td valign="top" align="center">71.7</td>
<td valign="top" align="center">0.013 (0.046)</td>
<td valign="top" align="center">0.124 (0.166)</td>
<td valign="top" align="center">0.089 (0.042)</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Group 2</td>
<td valign="top" align="left">536</td>
<td valign="top" align="center">84.8</td>
<td valign="top" align="center">0.008 (0.034)</td>
<td valign="top" align="center">0.111 (0.151)</td>
<td valign="top" align="center">0.094 (0.044)</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Group 3</td>
<td valign="top" align="left">283</td>
<td valign="top" align="center">81.3</td>
<td valign="top" align="center">0.013 (0.036)</td>
<td valign="top" align="center">0.198 (0.178)</td>
<td valign="top" align="center">0.160 (0.076)</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Group 4</td>
<td valign="top" align="left">374</td>
<td valign="top" align="center">83.8</td>
<td valign="top" align="center">0.008 (0.034)</td>
<td valign="top" align="center">0.184 (0.161)</td>
<td valign="top" align="center">0.154 (0.073)</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Group 5</td>
<td valign="top" align="left">493</td>
<td valign="top" align="center">89.0</td>
<td valign="top" align="center">0.007 (0.029)</td>
<td valign="top" align="center">0.167 (0.136)</td>
<td valign="top" align="center">0.095 (0.045)</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Mixed</td>
<td valign="top" align="left">106</td>
<td valign="top" align="center">92.3</td>
<td valign="top" align="center">0.019 (0.034)</td>
<td valign="top" align="center">0.159 (0.126)</td>
<td valign="top" align="center">0.147 (0.069)</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p><italic>All analyses were based on 2,179 O. glaberrima accessions genotyped with 3,834 polymorphic SNPs</italic>.</p>
</table-wrap-foot>
</table-wrap>
<p>When pairwise <italic>F</italic><sub>ST</sub> values were compared to understand the extent of genetic differentiation (divergence) between pairs of countries (Supplementary Table <xref ref-type="supplementary-material" rid="SM3">S3</xref>), the values were highly variable ranging from 0.020 (little genetic differentiation) to 0.420 (very great genetic differentiation). Accessions from Togo showed very great genetic differentiation (0.261&#x02013;0.420) as compared with all other countries, except moderate differentiation from Ghana (0.115) and great genetic differentiation from Nigeria (0.188). <italic>O. glaberrima</italic> accessions from Liberia showed very great genetic differentiation from those from Cameroon (0.302), Chad (0.310), and Gambia (0.282), and great differentiation from those from Burkina Faso (0.221), Ghana (0.246) and Guinea Bissau (0.218). Accessions from Mali showed great genetic differentiation from those from Liberia (0.241), Cameroon (0.175) Chad (0.165) and Gambia (0.154), and moderate differentiation from all other countries. Similarly, accessions from Nigeria showed great differentiation from those accessions from Liberia (0.217) and moderate differentiation as compared with all other countries (Supplementary Table <xref ref-type="supplementary-material" rid="SM3">S3</xref>). Neighbor-joining cluster analysis performed on the pairwise <italic>F</italic><sub>ST</sub> values computed among pairs of countries showed three clusters, which corresponds to (i) the Liberia, Senegal, Guinea Conakry, Guinea Bissau, Burkina Faso and Mali group (although Liberia was a bit of an outlier); (ii) the Nigeria, Gambia, Cameroon and Chad group, and (iii) the Ghana and Togo group, which showed the greatest within-group differentiation (Supplementary Figure <xref ref-type="supplementary-material" rid="SM5">S6</xref>). The estimated pairwise fixation indices (<italic>F</italic><sub><italic>ST</italic></sub>) among eight ecologies varied from 0.026 to 0.250 (Supplementary Table <xref ref-type="supplementary-material" rid="SM3">S3</xref>), of which the rainfed lowland ecology showed the highest genetic differentiation as compared to the floating (0.246), swamp (0.224), and hydromorphic (0.250) ecologies. Neighbor-joining cluster analysis performed on the pairwise <italic>F</italic><sub>ST</sub> values computed among pairs of ecologies revealed distinct clusters for the rainfed and upland ecologies as compared to all other ecologies (Supplementary Figure <xref ref-type="supplementary-material" rid="SM5">S6</xref>).</p>
<p>Results from partitioning of the overall molecular variance into different hierarchical levels revealed that differences in ecology and country of origin accounted for 10.8 and 18.1% of the genetic variation, respectively (Table <xref ref-type="table" rid="T4">4</xref>). Higher among-groups variation was also observed when the variance components were partitioned based on the number of groups predicted using cluster analysis (27.3%) and the model-based STRUCTURE at <italic>K</italic> &#x0003D; 5 (28.9%) than either countries of origin or ecologies. Pairwise <italic>F</italic><sub>ST</sub> values among accessions that belong to group 1 predicted based on cluster analysis and the model-based STRUCTURE was the highest (0.268&#x02013;0.469) as compared to the other four groups. A random permutation test indicated that the proportion of variance attributable for all hierarchical levels were highly significant (<italic>p</italic> &#x0003C; 0.001).</p>
<table-wrap position="float" id="T4">
<label>Table 4</label>
<caption><p>Analysis of molecular variance (AMOVA) for the extraction of SNP variation among and within groups (populations) based on 2,179 <italic>O. glaberrima</italic> accessions genotyped with 3,834 polymorphic SNPs.</p></caption>
<table frame="hsides" rules="groups">
<thead><tr>
<th valign="top" align="left"><bold>Category</bold></th>
<th valign="top" align="left"><bold>Source of variation</bold></th>
<th valign="top" align="center"><bold>d.f</bold>.</th>
<th valign="top" align="center"><bold>Sum of squares</bold></th>
<th valign="top" align="center"><bold>Variance components</bold></th>
<th valign="top" align="center"><bold>Percentage of variation</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Country of origin<xref ref-type="table-fn" rid="TN1"><sup>&#x0002A;</sup></xref></td>
<td valign="top" align="left">Among groups</td>
<td valign="top" align="center">13</td>
<td valign="top" align="center">202,566.7</td>
<td valign="top" align="center">54.5</td>
<td valign="top" align="center">18.1</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Within groups</td>
<td valign="top" align="center">4,344</td>
<td valign="top" align="center">1,072,188.8</td>
<td valign="top" align="center">246.8</td>
<td valign="top" align="center">81.9</td>
</tr>
<tr style="border-bottom: thin solid #000000;">
<td/>
<td valign="top" align="left">Total</td>
<td valign="top" align="center">4,357</td>
<td valign="top" align="center">1,274,755.5</td>
<td valign="top" align="center">301.3</td>
<td valign="top" align="center">100.0</td>
</tr> <tr>
<td valign="top" align="left">Ecology<xref ref-type="table-fn" rid="TN1"><sup>&#x0002A;</sup></xref></td>
<td valign="top" align="left">Among groups</td>
<td valign="top" align="center">7</td>
<td valign="top" align="center">107,343.2</td>
<td valign="top" align="center">32.4</td>
<td valign="top" align="center">10.8</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Within groups</td>
<td valign="top" align="center">4,350</td>
<td valign="top" align="center">1,167,789.9</td>
<td valign="top" align="center">268.5</td>
<td valign="top" align="center">89.2</td>
</tr>
<tr style="border-bottom: thin solid #000000;">
<td/>
<td valign="top" align="left">Total</td>
<td valign="top" align="center">4,357</td>
<td valign="top" align="center">1,275,133.1</td>
<td valign="top" align="center">300.9</td>
<td valign="top" align="center">100.0</td>
</tr> <tr>
<td valign="top" align="left">Groups based on STRUCTURE at K &#x0003D; 5</td>
<td valign="top" align="left">Among groups</td>
<td valign="top" align="center">5</td>
<td valign="top" align="center">316,630.5</td>
<td valign="top" align="center">89.6</td>
<td valign="top" align="center">28.9</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Within groups</td>
<td valign="top" align="center">4,352</td>
<td valign="top" align="center">958,124.9</td>
<td valign="top" align="center">220.2</td>
<td valign="top" align="center">71.1</td>
</tr>
<tr style="border-bottom: thin solid #000000;">
<td/>
<td valign="top" align="left">Total</td>
<td valign="top" align="center">4,357</td>
<td valign="top" align="center">1,274,755.4</td>
<td valign="top" align="center">309.8</td>
<td valign="top" align="center">100.0</td>
</tr> <tr>
<td valign="top" align="left">Groups based on cluster analysis</td>
<td valign="top" align="left">Among groups</td>
<td valign="top" align="center">4</td>
<td valign="top" align="center">289,596.6</td>
<td valign="top" align="center">84.8</td>
<td valign="top" align="center">27.3</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Within groups</td>
<td valign="top" align="center">4,353</td>
<td valign="top" align="center">985,158.8</td>
<td valign="top" align="center">226.3</td>
<td valign="top" align="center">72.7</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Total</td>
<td valign="top" align="center">4,357</td>
<td valign="top" align="center">1,274,755.4</td>
<td valign="top" align="center">311.1</td>
<td valign="top" align="center">100.0</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="TN1"><label>&#x0002A;</label><p><italic>Countries of origin: Burkina Faso, Cameroon, Chad, Gambia, Ghana, Guinea Conakry, Guinea Bissau, Ivory Coast, Liberia, Mali, Nigeria, Senegal, Togo, and &#x0201C;others,&#x0201D; which consisted of all other countries with &#x0003C;10 accessions. Ecologies of origin: Floating, Hydromorphic, Irrigated lowland, Lowland irrigated/rainfed, Rainfed lowland, Mangrove, Swamp, and upland</italic>.</p></fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec>
<title>Creating core and mini-core collections</title>
<p>As shown in Supplementary Figure <xref ref-type="supplementary-material" rid="SM5">S7</xref>, the sphericity index was almost linear with relatively low slope until it reached to a sample size of 849 accessions on the x-axis, which suggests that the 849 accessions are not informative (highly similar with other accessions) and can be removed from the dataset without notably modifying the sphericity index (Supplementary Figure <xref ref-type="supplementary-material" rid="SM5">S8a</xref>). The remaining 1,330 accessions can be chosen to represent a core collection of <italic>O. glaberrima</italic> germplasm (Supplementary Figure <xref ref-type="supplementary-material" rid="SM5">S8b</xref>, Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S1</xref>). The sphericity index increases rapidly between 849 to 1850 on the x-axis, which suggests that edges that constitute the backbone of the phylogenetic tree have been removed. Thus, the remaining 329 accessions could form the mini-core set. We propose retaining 350 accessions to represent a mini-core collection of the <italic>O. glaberrima</italic> germplasm (Figure <xref ref-type="fig" rid="F5">5</xref>, Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S1</xref>). The selected core and mini-core sets originated from 22 and 20 countries, respectively (Table <xref ref-type="table" rid="T2">2</xref>).</p>
<fig id="F5" position="float">
<label>Figure 5</label>
<caption><p>Neighbor joining tree and principal component analysis of the 350 mini-core accessions based on 3,709 of the 3,834 SNPs that were polymorphic within this set; <bold>(A)</bold> Neighbor joining tree from DARwin; and <bold>(B)</bold> plot of PC1 (10.6%) and PC2 (5.7%) from principal component analyses. Accessions belonging to each of the five groups predicted based on STRUCTURE in Figure <xref ref-type="fig" rid="F3">3</xref> are shown with the same color (Group 1, orange font; Group 2, blue font; Group 3, green font; Group 4, black font; Group 5, pink font, and mixed, red font). See Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S1</xref> for details.</p></caption>
<graphic xlink:href="fpls-08-01748-g0005.tif"/>
</fig>
<p>The genotypic data of the whole collection was compared to the data sets generated for the core and mini core sets for polymorphism, allele and genotype (combination of alleles) frequency, and genetic distance. For the 3,834 SNPs that were polymorphic in the whole <italic>O. glaberrima</italic> accessions, the reduction in sample size from 2,179 accessions to 1,330 accessions in the core and 350 accessions in the mini-core decreased the number of polymorphic SNPs only by 53 (1.4%) and 125 (3.3%), respectively. Both allele and genotype frequencies in the core and mini-core sets were the same as the whole set (Figure <xref ref-type="fig" rid="F6">6</xref>). As expected, however, genetic distance between pairs of accessions increased significantly in the core and mini-core sets (Figure <xref ref-type="fig" rid="F1">1</xref>, Supplemental Table <xref ref-type="supplementary-material" rid="SM4">S4</xref>). The proportion of pairs of accessions with genetic distance exceeding 0.10 was 90.5% for the whole set as compared with 95.3% in the core and 99.9% in the mini-core sets. The average phenotypic traits (number of tillers, days to heading, plant height, blade length, blade width, and panicle length) in the core and mini-core sets were basically the same as the whole <italic>O. glaberrima</italic> collection (Table <xref ref-type="table" rid="T5">5</xref>). The proportion of accessions selected from each group predicted based on STRUCTURE and cluster analysis was not equal, but reflected the size of each group or cluster (Figure <xref ref-type="fig" rid="F7">7A</xref>). Using the group membership from STRUCTURE, the mini-core collection comprised of 18 accessions from group 1; 36 accessions from group 2; 120 accessions from group 3; 101 accessions from group 4; 27 accessions from group 5; and 48 accessions from the admixed group. Although the selected mini-core set of accessions represent 20 countries and all 9 ecologies, the majority of them originated from 9 countries (Figure <xref ref-type="fig" rid="F7">7B</xref>) and 6 ecologies (Figure <xref ref-type="fig" rid="F7">7C</xref>).</p>
<fig id="F6" position="float">
<label>Figure 6</label>
<caption><p>Summary of <bold>(A)</bold> allele frequencies and <bold>(B)</bold> genotype frequencies of the entire <italic>O. glaberrima</italic> accessions (<italic>N</italic> &#x0003D; 2,179) based on 3,834 polymorphic SNPs as compared with a core set of 1,330 accessions using 3,781 polymorphic SNPs, and a mini-core set of 350 accessions using 3,709 polymorphic SNPs. Nucleotide codes are as follows: A, adenine; C, cytosine; G, guanine; T, thymine; Y, C or T; R, A or G; K, G or T; M, A or C; W, A or T; S, G or C (<ext-link ext-link-type="uri" xlink:href="http://www.bioinformatics.org/sms/iupac.html">http://www.bioinformatics.org/sms/iupac.html</ext-link>; accessed in Sept. 2017).</p></caption>
<graphic xlink:href="fpls-08-01748-g0006.tif"/>
</fig>
<table-wrap position="float" id="T5">
<label>Table 5</label>
<caption><p>Summary of seven phenotypic descriptors for the core and mini-core sets as compared to the whole <italic>O. glaberrima</italic> collection based on unreplicated data evaluation at the AfricaRice experimental station in Cotonou, Benin.</p></caption>
<table frame="hsides" rules="groups">
<thead><tr>
<th valign="top" align="left"><bold>Trait</bold></th>
<th valign="top" align="left"><bold>Entries</bold></th>
<th valign="top" align="center"><bold>No. of entries with no missing phenotype<xref ref-type="table-fn" rid="TN2"><sup>&#x0002A;</sup></xref></bold></th>
<th valign="top" align="center"><bold>Minimum</bold></th>
<th valign="top" align="center"><bold>Maximum</bold></th>
<th valign="top" align="center"><bold>Mean</bold></th>
<th valign="top" align="center"><bold>Standard deviation</bold></th>
<th valign="top" align="center"><bold>Coefficient of variation</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Days to 50% heading (d)</td>
<td valign="top" align="left">All</td>
<td valign="top" align="center">2,047</td>
<td valign="top" align="center">63.0</td>
<td valign="top" align="center">183.0</td>
<td valign="top" align="center">112.7</td>
<td valign="top" align="center">21.6</td>
<td valign="top" align="center">19.1</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Core</td>
<td valign="top" align="center">1,221</td>
<td valign="top" align="center">63.0</td>
<td valign="top" align="center">183.0</td>
<td valign="top" align="center">117.4</td>
<td valign="top" align="center">22.1</td>
<td valign="top" align="center">18.8</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Mini-core</td>
<td valign="top" align="center">319</td>
<td valign="top" align="center">71.0</td>
<td valign="top" align="center">183.0</td>
<td valign="top" align="center">124.4</td>
<td valign="top" align="center">21.2</td>
<td valign="top" align="center">17.0</td>
</tr>
<tr>
<td valign="top" align="left">Total number of tillers</td>
<td valign="top" align="left">All</td>
<td valign="top" align="center">1,983</td>
<td valign="top" align="center">3.2</td>
<td valign="top" align="center">78.5</td>
<td valign="top" align="center">23.3</td>
<td valign="top" align="center">8.5</td>
<td valign="top" align="center">36.5</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Core</td>
<td valign="top" align="center">1,171</td>
<td valign="top" align="center">4.0</td>
<td valign="top" align="center">78.5</td>
<td valign="top" align="center">23.6</td>
<td valign="top" align="center">8.6</td>
<td valign="top" align="center">36.4</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Mini-core</td>
<td valign="top" align="center">301</td>
<td valign="top" align="center">6.8</td>
<td valign="top" align="center">77.0</td>
<td valign="top" align="center">24.5</td>
<td valign="top" align="center">9.1</td>
<td valign="top" align="center">37.3</td>
</tr>
<tr>
<td valign="top" align="left">Number of fertile tillers</td>
<td valign="top" align="left">All</td>
<td valign="top" align="center">1,975</td>
<td valign="top" align="center">1.0</td>
<td valign="top" align="center">44.0</td>
<td valign="top" align="center">16.0</td>
<td valign="top" align="center">6.8</td>
<td valign="top" align="center">42.7</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Core</td>
<td valign="top" align="center">1,167</td>
<td valign="top" align="center">1.0</td>
<td valign="top" align="center">43.4</td>
<td valign="top" align="center">15.3</td>
<td valign="top" align="center">6.8</td>
<td valign="top" align="center">44.4</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Mini-core</td>
<td valign="top" align="center">298</td>
<td valign="top" align="center">1.5</td>
<td valign="top" align="center">43.4</td>
<td valign="top" align="center">14.2</td>
<td valign="top" align="center">7.0</td>
<td valign="top" align="center">49.2</td>
</tr>
<tr>
<td valign="top" align="left">Plant height (cm)</td>
<td valign="top" align="left">All</td>
<td valign="top" align="center">1,980</td>
<td valign="top" align="center">82.8</td>
<td valign="top" align="center">182.0</td>
<td valign="top" align="center">130.4</td>
<td valign="top" align="center">15.8</td>
<td valign="top" align="center">12.2</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Core</td>
<td valign="top" align="center">1,167</td>
<td valign="top" align="center">82.8</td>
<td valign="top" align="center">182.0</td>
<td valign="top" align="center">131.3</td>
<td valign="top" align="center">16.5</td>
<td valign="top" align="center">12.6</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Mini-core</td>
<td valign="top" align="center">297</td>
<td valign="top" align="center">86.0</td>
<td valign="top" align="center">182.0</td>
<td valign="top" align="center">132.2</td>
<td valign="top" align="center">17.7</td>
<td valign="top" align="center">13.4</td>
</tr>
<tr>
<td valign="top" align="left">Panicle length (cm)</td>
<td valign="top" align="left">All</td>
<td valign="top" align="center">1,981</td>
<td valign="top" align="center">1.9</td>
<td valign="top" align="center">58.0</td>
<td valign="top" align="center">31.9</td>
<td valign="top" align="center">6.3</td>
<td valign="top" align="center">19.7</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Core</td>
<td valign="top" align="center">1,169</td>
<td valign="top" align="center">1.9</td>
<td valign="top" align="center">58.0</td>
<td valign="top" align="center">31.6</td>
<td valign="top" align="center">6.7</td>
<td valign="top" align="center">21.2</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Mini-core</td>
<td valign="top" align="center">299</td>
<td valign="top" align="center">13.4</td>
<td valign="top" align="center">58.0</td>
<td valign="top" align="center">30.5</td>
<td valign="top" align="center">6.7</td>
<td valign="top" align="center">21.9</td>
</tr>
<tr>
<td valign="top" align="left">Leaf blade length (cm)</td>
<td valign="top" align="left">All</td>
<td valign="top" align="center">1,990</td>
<td valign="top" align="center">16.7</td>
<td valign="top" align="center">75.6</td>
<td valign="top" align="center">37.0</td>
<td valign="top" align="center">8.3</td>
<td valign="top" align="center">22.4</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Core</td>
<td valign="top" align="center">1,175</td>
<td valign="top" align="center">16.9</td>
<td valign="top" align="center">70.1</td>
<td valign="top" align="center">36.5</td>
<td valign="top" align="center">8.6</td>
<td valign="top" align="center">23.5</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Mini-core</td>
<td valign="top" align="center">303</td>
<td valign="top" align="center">16.9</td>
<td valign="top" align="center">70.1</td>
<td valign="top" align="center">35.7</td>
<td valign="top" align="center">9.2</td>
<td valign="top" align="center">25.6</td>
</tr>
<tr>
<td valign="top" align="left">Leaf blade width (cm)</td>
<td valign="top" align="left">All</td>
<td valign="top" align="center">1,978</td>
<td valign="top" align="center">0.8</td>
<td valign="top" align="center">3.5</td>
<td valign="top" align="center">1.8</td>
<td valign="top" align="center">0.4</td>
<td valign="top" align="center">21.1</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Core</td>
<td valign="top" align="center">1,171</td>
<td valign="top" align="center">0.8</td>
<td valign="top" align="center">3.5</td>
<td valign="top" align="center">1.7</td>
<td valign="top" align="center">0.4</td>
<td valign="top" align="center">21.3</td>
</tr>
<tr>
<td/>
<td valign="top" align="left">Mini-core</td>
<td valign="top" align="center">302</td>
<td valign="top" align="center">0.9</td>
<td valign="top" align="center">2.6</td>
<td valign="top" align="center">1.6</td>
<td valign="top" align="center">0.3</td>
<td valign="top" align="center">20.1</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p><italic>Each accession was represented by mean values of 5 randomly selected plants.</italic></p>
<fn id="TN2"><label>&#x0002A;</label><p><italic>The total number of accessions for the whole collection, core, and mini-core sets were 2,179, 1,330 and 350. Some accessions did not germinate; accessions with extremely small or large values were excluded from the phenotype data based on frequency distribution and boxplots</italic>.</p></fn>
</table-wrap-foot>
</table-wrap>
<fig id="F7" position="float">
<label>Figure 7</label>
<caption><p>The distribution of accessions selected to represent mini-core collection by <bold>(A)</bold> groups predicted based on STRUCTURE and cluster analysis; <bold>(B)</bold> countries of origin, and <bold>(C)</bold> adaptation ecologies. See Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S1</xref> for details.</p></caption>
<graphic xlink:href="fpls-08-01748-g0007.tif"/>
</fig>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<title>Discussion</title>
<sec>
<title>Low genetic variation exists in the collection of <italic>O. glaberrima</italic></title>
<p>Nearly 60% of the 27,560 SNPs used for genotyping 5 rice species was initially polymorphic within the <italic>O. glaberrima</italic> collection; however, 46% of the polymorphisms were due to just 44 accessions (Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S1</xref>) that showed extremely different pattern as compared with all other <italic>O. glaberrima</italic> accessions (Supplementary Figure <xref ref-type="supplementary-material" rid="SM5">S2</xref>). It is possible that the 44 accessions may possess rare alleles that made them very different from the remaining 2,179 <italic>O. glaberrima</italic> accessions. However, those 44 accessions may also be natural introgressions involving <italic>O. glaberrima</italic> and another <italic>Oryza</italic> species, as has been reported in other studies (Jones et al., <xref ref-type="bibr" rid="B33">1997</xref>; Semon et al., <xref ref-type="bibr" rid="B72">2005</xref>; Orjuela et al., <xref ref-type="bibr" rid="B55">2014</xref>). For example, Orjuela et al. (<xref ref-type="bibr" rid="B55">2014</xref>) reported some weedy type accessions that were intermediate between <italic>O. glaberrima</italic> and <italic>O. barthii</italic>, which were collected primarily in countries where the wild <italic>O. barthii</italic> grow near <italic>O. glaberrima</italic> fields. The presence of cultivated and wild species in the same area probably favored interspecific gene flow between two rice species, which resulted to the development of intermediate forms. Furthermore, we cannot rule out the possibility that other <italic>Oryza</italic> species were mislabeled as <italic>O. glaberrima</italic> during collection or at some stage during seed/DNA handling, DNA contamination, and/or genotyping error. These possible errors can be corrected with further study, including phenotypic evaluation of the 44 accessions in comparison with other widely used <italic>O. glaberrima</italic> accessions, and comparing the DArTseq data from the 44 accessions to data generated from other <italic>Oryza</italic> species. Due to such concerns, we presented detailed results on 2,179 accessions, excluding the 44 accessions listed in Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S1</xref>.</p>
<p>When the 44 accessions described above were excluded, only 13.9% of the SNPs (3,834 of the 27,560 SNPs) were polymorphic within the remaining 2,179 <italic>O. glaberrima</italic> accessions (Table <xref ref-type="table" rid="T2">2</xref>), which is lower than the polymorphism levels observed within <italic>O. barthii</italic> (18.9%) and <italic>O. longistaminata</italic> (30.3%) (MN Ndjiondjop, unpublished). In another study, we used the same set of 27,560 SNPs for genotyping 331 widely used rice genotypes in Africa, which includes 85 &#x0201C;New Rice for Africa (NERICA)&#x0201D; improved varieties, 11 &#x0201C;Advanced Rice for Africa (ARICA)&#x0201D; varieties, 62 <italic>O. sativa</italic> spp. japonica, and 172 <italic>O. sativa</italic> spp. indica genotypes. Sixty six percent of the SNPs (18,186 of the 27,560 SNPs) were polymorphic across all 331 genotypes, of which 15,020 SNP (82.6%) were physically mapped in to one of the rice chromosomes. Of the 15,020 physically mapped SNPs, nearly 37, 43, 48, and 49%, respectively, were polymorphic within ARICA, japonica, indica, and NERICA genotypes (MN Ndjiondjop, unpublished); therefore, the level of polymorphism observed in <italic>O. sativa</italic> and interspecific NERICA genotypes was from 2.5 to 3.5 times higher than that of <italic>O. glaberrima</italic>. Several previous molecular studies conducted on <italic>O. glaberrima</italic> have also reported a narrow genetic base compared to other <italic>Oryza</italic> species (Joshi et al., <xref ref-type="bibr" rid="B34">2000</xref>; Ishii et al., <xref ref-type="bibr" rid="B32">2001</xref>; Park et al., <xref ref-type="bibr" rid="B57">2003</xref>; Semon et al., <xref ref-type="bibr" rid="B72">2005</xref>; Kwon et al., <xref ref-type="bibr" rid="B37">2006</xref>; Dram&#x000E9; et al., <xref ref-type="bibr" rid="B16">2011</xref>; Li et al., <xref ref-type="bibr" rid="B40">2011</xref>; Orjuela et al., <xref ref-type="bibr" rid="B55">2014</xref>; Wang et al., <xref ref-type="bibr" rid="B80">2014</xref>; Meyer et al., <xref ref-type="bibr" rid="B47">2016</xref>). However, these previous studies were based on small numbers of accessions and/or markers, and the very large number of accessions and SNPs in the current study is much more definitive. The low levels of diversity confirmed in the present study may be due to a severe bottleneck that occurred during its domestication (Li et al., <xref ref-type="bibr" rid="B40">2011</xref>; Wang et al., <xref ref-type="bibr" rid="B80">2014</xref>; Meyer et al., <xref ref-type="bibr" rid="B47">2016</xref>). Based on nucleotide diversity, the minor allele frequency spectrum, linkage disequilibrium (LD) and Tajima&#x00027;s <italic>D</italic>-values estimated from genome sequence data, Wang et al. (<xref ref-type="bibr" rid="B80">2014</xref>) suggested that the significant reduction in genetic diversity within <italic>O. glaberrima</italic> is a consequence of domestication, which is consistent with other studies reporting reduction in genetic diversity in domesticated crops as compared to their wild progenitors (Reif et al., <xref ref-type="bibr" rid="B62">2005</xref>; Wright et al., <xref ref-type="bibr" rid="B84">2005</xref>; Lam et al., <xref ref-type="bibr" rid="B38">2010</xref>; Huang et al., <xref ref-type="bibr" rid="B31">2012</xref>).</p>
<p><italic>O. glaberrima</italic> is a selfing species with outcrossing rates ranging from 2 to 5% (Semon et al., <xref ref-type="bibr" rid="B72">2005</xref>), even lower than many other selfing species (Barnaud et al., <xref ref-type="bibr" rid="B4">2008</xref>). As a result, most accessions were expected to display less than the average observed heterozygosity expected in S<sub>5</sub> breeding lines derived from biparental crosses (3.1%). This was seen with &#x0007E;95% of the accessions, but the remaining &#x0007E;4% (81 of 2,179 accessions) had observed heterozygosity exceeding 5% (Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S1</xref>), which is higher than expected in the absence of human error. Some changes in allele frequencies may have occurred during seed regeneration, maintenance breeding, and possible contamination with seeds or pollen of other samples (Heckenberger et al., <xref ref-type="bibr" rid="B29">2002</xref>; Warburton et al., <xref ref-type="bibr" rid="B81">2010</xref>). These errors can easily be controlled with the development of quality control genotyping methods using a subset of 50 to 100 preselected markers following seed production (Semagn et al., <xref ref-type="bibr" rid="B67">2012a</xref>; Ertiro et al., <xref ref-type="bibr" rid="B22">2015</xref>), which will be addressed in another study.</p>
</sec>
<sec>
<title>Genetic distance and population structure</title>
<p>Genetic distance is a measure of the genetic divergence between pairs of accessions or populations, with pairs that share many alleles having small genetic distance. Results from the present study showed highly variable levels of genetic distances between pairs of <italic>O. glaberrima</italic> accessions, with 1.5% of the pairs nearly identical, 8.0% of the pairs similar, 78.1% of the pairs moderately distant, and 12.4% of the pairs highly distant (Figure <xref ref-type="fig" rid="F1">1</xref>). Our results clearly suggest the presence of a low percentage of redundant accessions-that contribute very little to the observed genetic variation and genetic divergence in the <italic>O. glaberrima</italic> collection maintained by the AfricaRice genebank. Using cluster, principal component, and model-based population structure analyses, we observed five groups or clusters, which are generally consistent with their country of origin and somewhat less so with respect to their adaptation to the different rice growing ecologies (Figures <xref ref-type="fig" rid="F2">2</xref>&#x02013;<xref ref-type="fig" rid="F4">4</xref>, Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S1</xref>); this classification agrees with previous studies (Semon et al., <xref ref-type="bibr" rid="B72">2005</xref>; Orjuela et al., <xref ref-type="bibr" rid="B55">2014</xref>).</p>
<p>Most accessions from Togo in the present study were collected from the Danyi Plateau and clustered with some Nigerian accessions in the second group. Despite the availability in Togo of improved rice varieties, farmers on the Danyi Plateau in the Togo Hills still cultivate solely <italic>O. glaberrima</italic> landraces because of good grain quality and palatability as well as better adaptation to soil with low fertility and high acidity (Mokuwa et al., <xref ref-type="bibr" rid="B48">2014</xref>). These landraces produce heavier and larger seeds, which germinate better and produce more vigorous seedlings with deeper initial root system than smaller seeds (Roy et al., <xref ref-type="bibr" rid="B64">1996</xref>). The high genetic divergence of the <italic>O. glaberrima</italic> accessions from Togo compared with all other countries, except Ghana, is evident from the <italic>F</italic><sub>ST</sub> values presented in Supplementary Table <xref ref-type="supplementary-material" rid="SM3">S3</xref> and neighbor-joining tree constructed using the pairwise <italic>F</italic><sub>ST</sub> values (Supplementary Figure <xref ref-type="supplementary-material" rid="SM5">S6</xref>). Why some Nigerian accessions clustered with these divergent accessions from Togo, however, is unclear, but seed is easily traded and the two countries are not so distant. The clustering of accessions from these countries in to the same group may thus reflect historical trade routes.</p>
<p>Isolation by distance (Wright, <xref ref-type="bibr" rid="B82">1943</xref>) refers to a decline in gene flow with an increase in geographical distance between pairs of populations. In such cases, pairs of accessions or populations sampled in close geographic proximity to each other are expected to be less genetically divergent (more genetically similar) than those that are geographically far away from each other. While most accessions in the current study were more similar within countries (Figures <xref ref-type="fig" rid="F2">2</xref>&#x02013;<xref ref-type="fig" rid="F4">4</xref>), there were several divergent pairs of accessions within the same countries, and thus less evidence for isolation by distance in the <italic>O. glaberrima</italic> germplasm used in the present study. This is in contrast to a previous study (Semon et al., <xref ref-type="bibr" rid="B72">2005</xref>), and the larger numbers of accessions in the current study may also show evidence of migration via trade (which negates the decline in gene flow caused by distance). Most farmers in Africa trade seeds at nearby markets and with friends and relatives; this trade can cross country borders as can seed sold by regional seed traders. This may be particularly apparent in the fifth group that consisted of mixed accessions from multiple countries. Overall, pairwise <italic>F</italic><sub>ST</sub> values showed less differentiation between accessions from neighboring countries, with the exception of Gambia, which clustered closer to countries much further east (Supplementary Figure <xref ref-type="supplementary-material" rid="SM5">S6</xref>), possibly evidence of longer distance trade.</p>
<p>Knowledge of population structure is important for different purposes, including understanding the relative effect of evolutionary processes of migration/gene flow, mating system, selection, adaptation, and genetic drift on populations (including breeding populations) (Meirmans, <xref ref-type="bibr" rid="B46">2012</xref>). Human activities significantly affect the dynamics of genetic differentiation in different ways, including changing the dynamics of gene flow, genetic drift and selection (Barnaud et al., <xref ref-type="bibr" rid="B4">2008</xref>). AMOVA partitioned more of the molecular variation into groups (populations) based on country of origin (18.1%) than based on growing environment ecology (10.8%), indicating that migration (aided by humans) is a stronger (or faster acting) force on population structure than is selection for adaptation, drift, or mutation. The <italic>O. glaberrima</italic> germplasm used in the current study has not been selected for specific ecological adaptation, which may possibly be a reason for the lower observed genetic differentiation among ecologies than countries of origin. The proportion of molecular variation attributable among groups predicted from the cluster and model-based STRUCTURE was higher (27.3&#x02013;28.9%) than among countries and ecologies. Therefore, there was more genetic divergence among the predicted groups that was not fully explained by geographical proximity or ecology. The development of core and mini-core collections and selection of parental lines for breeding programs need to consider such genetic divergence.</p>
</sec>
<sec>
<title>Core and mini-core selection</title>
<p>The creation of core and mini-core germplasm collections that represent the maximum possible genetic diversity contained in the whole collection of a given species with a minimum of redundancy (Brown, <xref ref-type="bibr" rid="B9">1989</xref>) is an efficient way to identify suitable variation for breeding and other purposes. A core collection can be created using various methods (Odong et al., <xref ref-type="bibr" rid="B54">2013</xref>), including the random and stratified sampling methods that require subgroups created based on <italic>a priori</italic> knowledge (Brown, <xref ref-type="bibr" rid="B9">1989</xref>); the maximization of the allelic diversity/richness method using MSTRAT (Gouesnard et al., <xref ref-type="bibr" rid="B28">2001</xref>), Core Hunter (Thachuk et al., <xref ref-type="bibr" rid="B77">2009</xref>; Beukelaer et al., <xref ref-type="bibr" rid="B7">2012</xref>) and principal component scoring (Noirot et al., <xref ref-type="bibr" rid="B53">1996</xref>); and the distance-based methods, such as Core Hunter, MLST (Perrier et al., <xref ref-type="bibr" rid="B58">2003</xref>), and PowerCore (Kim et al., <xref ref-type="bibr" rid="B36">2007</xref>). The choice of appropriate method depends on several criteria, including the purpose of the study (e.g., to capture most variation as much as possible in small accessions as possible vs. to optimize the chance of finding new alleles) (Odong et al., <xref ref-type="bibr" rid="B54">2013</xref>), the computational speed of the method, and the need for <italic>a priori</italic> information (e.g., preselected markers, defined subgroups and/or sample size). In the maximization strategy, the main objective is to preserve the highest number of alleles, which is ideal for germplasm conservation, while the distance-based methods primarily aim to maintain most combinations of alleles in specific genotypes (maximize the combination of allelic diversity at the genome level), which is appropriate in breeding (Leroy et al., <xref ref-type="bibr" rid="B39">2014</xref>). The distance-based methods have been strongly recommend for creating core collection, because they allow the simultaneous evaluation of all variables describing accessions, and also provide interpretable criteria/statistical support as compared with other methods (Odong et al., <xref ref-type="bibr" rid="B54">2013</xref>). MLST has multiple advantages over other methods. First, it uses all markers simultaneously through a measure of dissimilarity instead of preselected subset of markers/alleles. Second, it considers the population structure in the data from the phylogenetic tree. Third, it requires neither <italic>a priori</italic> predefined subgroups nor <italic>a priori</italic> fixed sample size. Finally, it provides detailed statistical support indicators for users to choose an optimal core or mini-core sample size. MLST has been used in creating core collection in diverse species, including <italic>Prunus avium</italic> (Campoy et al., <xref ref-type="bibr" rid="B10">2016</xref>), <italic>Vigna unguiculata</italic> (Egbadzor et al., <xref ref-type="bibr" rid="B18">2014</xref>), <italic>Coffea canephora</italic> (Leroy et al., <xref ref-type="bibr" rid="B39">2014</xref>), and <italic>Olea europaea</italic> (El Bakkali et al., <xref ref-type="bibr" rid="B20">2013</xref>). Using MLST, we propose 1,330 and 350 <italic>O. glaberrima</italic> accessions to represent a core and mini-core collection, respectively (Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S1</xref>). Core and mini-core sets can be developed using geographical origin, phenotypic traits, and biochemical and genetic markers; however, use of genetic distance computed from high density molecular markers from next generation sequencing technology is a promising method (Pessoa-Filho et al., <xref ref-type="bibr" rid="B59">2010</xref>). The ability to measure sequence variation across the entire genome allows core sets to be chosen potentially based on all genes, and the effect of the environment does not influence the selection. If chosen randomly, between 5 and 20% of a core collection captures up to 70% of the genetic diversity observed in the whole collection (Brown, <xref ref-type="bibr" rid="B9">1989</xref>; Van Hintum et al., <xref ref-type="bibr" rid="B79">2000</xref>).</p>
<p>In rice, previously suggested core collections contain from 1% (Chung et al., <xref ref-type="bibr" rid="B13">2009</xref>) to 15% (Liu et al., <xref ref-type="bibr" rid="B42">2015</xref>) of the total number of accessions of the collections they represent. Using 435 alleles scored from 36 microsatellite markers, for example, only 1.4% (98 out of 6,912 accessions) were selected to represent a mini-core set of Indian rice collection conserved at the National Bureau of Plant Genetic Resources, New Delhi, India (Tiwari et al., <xref ref-type="bibr" rid="B78">2015</xref>); the selected mini-core set captured 100% of the total number of alleles. Using 482 alleles from 15 microsatellite markers, only 4% (162 of 4,046 accessions) sampled from the National GeneBank of Rural Development Administration in the Republic of Korea captured 100% of the allelic variation (Zhao et al., <xref ref-type="bibr" rid="B88">2010</xref>). Recently, Egea and colleagues used 14,392 SNPs from DArTseq for genotyping 417 garlic samples (<italic>Allium sativum</italic>), which allowed them in identifying 286 unique samples to represent a core collection (Egea et al., <xref ref-type="bibr" rid="B19">2017</xref>). In barley, Munoz-Amatriain and colleagues recently used 7,842 SNPs to genotype 2,417 accessions sampled from the United States Department of Agriculture (USDA) National Small Grains Collection and created a mini-core set of 186 accessions that captured the majority of the allelic diversity present in the core collection (Munoz-Amatriain et al., <xref ref-type="bibr" rid="B50">2014</xref>). The mini-core collection proposed in the present study is easily manageable for detailed phenotypic evaluation under field and controlled conditions for parent selection in developing new improved rice germplasm for target traits of interest, mining genes and genomic regions associated with target traits of economic importance using genome-wide association studies, and easy for wide germplasm distribution.</p>
</sec>
</sec>
<sec sec-type="conclusions" id="s5">
<title>Conclusions</title>
<p>The present study demonstrated the usefulness of DArTseq in effectively characterizing the genetic variation and population structure of <italic>O. glaberrima</italic> collection conserved at the AfricaRice genebank, and in creating a core and mini-core collections. Overall, <italic>O. glaberrima</italic> showed very low genetic variation, but clear population structure, primarily by countries of origin, and less so by ecology. The mini-core collection accounts &#x0007E;16% of the whole <italic>O. glaberrima</italic> germplasm and represents all countries and ecologies of origin, and all groups predicted based on both cluster and population STRUCTURE analyses, proportionally to the size of each cluster. This mini-core collection will be highly valuable for various purposes, including allele mining and donor parent selection for developing new improved rice germplasm for target traits of interest.</p>
</sec>
<sec id="s6">
<title>Data availability</title>
<p>All relevant results are included within this article and its additional files. The original DArTseq data are available from the corresponding author on request.</p>
</sec>
<sec id="s7">
<title>Author contributions</title>
<p>MNN conceived, designed, and supervised the experiments, secured funding, and partly drafted the paper; ACG, SBK, DDT, and AGo were responsible for sample preparation, phenotyping, DNA extraction and/or compilation of passport information; KS analyzed the data and wrote most part of the paper; XP contributed to data analysis to create core and mini-core collection; MSo, MSi, and AGh provided valuable suggestions on the paper; MLW contributed to and edited the paper. All authors read and approved the paper.</p>
<sec>
<title>Conflict of interest statement</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p></sec>
</sec>
</body>
<back>
<ack>
<p>The present study was supported by a grant given to MNN (AfricaRice) from the Global Diversity Crop Trust (GDCT) through the Consultative Group on International Agricultural Research (CGIAR). The authors would like to thank Elisee Dannon, Marie Gouette and Fatondji Blandine for assisting on sample preparation and DNA extraction.</p>
</ack>
<sec sec-type="supplementary-material" id="s8">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fpls.2017.01748/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fpls.2017.01748/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="TableS1.XLSX" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="TableS2.XLSX" id="SM2" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="TableS3.XLSX" id="SM3" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="TableS4.XLSX" id="SM4" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="SupplementaryFigures.PDF" id="SM5" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Agrama</surname> <given-names>H. A.</given-names></name> <name><surname>WenGui</surname> <given-names>Y.</given-names></name> <name><surname>Lee</surname> <given-names>F.</given-names></name> <name><surname>Fjellstrorn</surname> <given-names>R.</given-names></name> <name><surname>Ming-Hsuan</surname> <given-names>C.</given-names></name> <name><surname>Jia</surname> <given-names>M.</given-names></name> <etal/></person-group>. (<year>2009</year>). <article-title>Genetic assessment of a mini-core subset developed from the USDA Rice Genebank</article-title>. <source>Crop Sci.</source> <volume>49</volume>, <fpage>1336</fpage>&#x02013;<lpage>1346</lpage>. <pub-id pub-id-type="doi">10.2135/cropsci2008.06.0551</pub-id></citation></ref>
<ref id="B2">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Al-Beyroutiov&#x000E1;</surname> <given-names>M.</given-names></name> <name><surname>Sabo</surname> <given-names>M.</given-names></name> <name><surname>Sleziak</surname> <given-names>P.</given-names></name> <name><surname>Du&#x00161;insk&#x000FD;</surname> <given-names>R.</given-names></name> <name><surname>Birc&#x000E1;k</surname> <given-names>E.</given-names></name> <name><surname>Hauptvogel</surname> <given-names>P.</given-names></name> <etal/></person-group>. (<year>2016</year>). <article-title>Evolutionary relationships in the genus <italic>Secale</italic> revealed by DArTseq DNA polymorphism</article-title>. <source>Plant Syst. Evol.</source> <volume>302</volume>, <fpage>1083</fpage>&#x02013;<lpage>1091</lpage>. <pub-id pub-id-type="doi">10.1007/s00606-016-1318-2</pub-id></citation></ref>
<ref id="B3">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Baloch</surname> <given-names>F. S.</given-names></name> <name><surname>Alsaleh</surname> <given-names>A.</given-names></name> <name><surname>Shahid</surname> <given-names>M. Q.</given-names></name> <name><surname>&#x000C7;ift&#x000E7;i</surname> <given-names>V.</given-names></name> <name><surname>S&#x000E1;enz De Miera</surname> <given-names>L. E.</given-names></name> <name><surname>Aasim</surname> <given-names>M.</given-names></name> <etal/></person-group>. (<year>2017</year>). <article-title>A whole genome DArTseq and SNP analysis for genetic diversity assessment in durum wheat from central fertile crescent</article-title>. <source>PLoS ONE</source> <volume>12</volume>:<fpage>e0167821</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0167821</pub-id><pub-id pub-id-type="pmid">28099442</pub-id></citation></ref>
<ref id="B4">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Barnaud</surname> <given-names>A.</given-names></name> <name><surname>Trigueros</surname> <given-names>G.</given-names></name> <name><surname>McKey</surname> <given-names>D.</given-names></name> <name><surname>Joly</surname> <given-names>H. I.</given-names></name></person-group> (<year>2008</year>). <article-title>High outcrossing rates in fields with mixed sorghum landraces: how are landraces maintained[quest]</article-title>. <source>Heredity (Edinb).</source> <volume>101</volume>, <fpage>445</fpage>&#x02013;<lpage>452</lpage>. <pub-id pub-id-type="doi">10.1038/hdy.2008.77</pub-id><pub-id pub-id-type="pmid">18685567</pub-id></citation></ref>
<ref id="B5">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Barrett</surname> <given-names>B. A.</given-names></name> <name><surname>Kidwell</surname> <given-names>K. K.</given-names></name></person-group> (<year>1998</year>). <article-title>AFLP-based genetic diversity assessment among wheat cultivars from the Pacific Northwest</article-title>. <source>Crop Sci.</source> <volume>38</volume>, <fpage>1261</fpage>&#x02013;<lpage>1271</lpage>. <pub-id pub-id-type="doi">10.2135/cropsci1998.0011183X003800050025x</pub-id></citation></ref>
<ref id="B6">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Beissinger</surname> <given-names>T. M.</given-names></name> <name><surname>Hirsch</surname> <given-names>C. N.</given-names></name> <name><surname>Sekhon</surname> <given-names>R. S.</given-names></name> <name><surname>Foerster</surname> <given-names>J. M.</given-names></name> <name><surname>Johnson</surname> <given-names>J. M.</given-names></name> <name><surname>Muttoni</surname> <given-names>G.</given-names></name> <etal/></person-group>. (<year>2013</year>). <article-title>Marker density and read-depth for genotyping populations using genotyping-by-sequencing</article-title>. <source>Genetics</source> <volume>193</volume>, <fpage>1073</fpage>&#x02013;<lpage>1081</lpage>. <pub-id pub-id-type="doi">10.1534/genetics.112.147710</pub-id><pub-id pub-id-type="pmid">23410831</pub-id></citation></ref>
<ref id="B7">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Beukelaer</surname> <given-names>H. D.</given-names></name> <name><surname>Sm&#x000FD;kal</surname> <given-names>P.</given-names></name> <name><surname>Davenport</surname> <given-names>G. F.</given-names></name> <name><surname>Fack</surname> <given-names>V.</given-names></name></person-group> (<year>2012</year>). <article-title>Core Hunter II: fast core subset selection based on multiple genetic diversity measures using Mixed Replica search</article-title>. <source>BMC Bioinform.</source> <volume>13</volume>:<fpage>312</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2105-13-312</pub-id><pub-id pub-id-type="pmid">23174036</pub-id></citation></ref>
<ref id="B8">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bradbury</surname> <given-names>P. J.</given-names></name> <name><surname>Zhang</surname> <given-names>Z.</given-names></name> <name><surname>Kroon</surname> <given-names>D. E.</given-names></name> <name><surname>Casstevens</surname> <given-names>T. M.</given-names></name> <name><surname>Ramdoss</surname> <given-names>Y.</given-names></name> <name><surname>Buckler</surname> <given-names>E. S.</given-names></name></person-group> (<year>2007</year>). <article-title>TASSEL: software for association mapping of complex traits in diverse samples</article-title>. <source>Bioinformatics</source> <volume>23</volume>, <fpage>2633</fpage>&#x02013;<lpage>2635</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btm308</pub-id><pub-id pub-id-type="pmid">17586829</pub-id></citation></ref>
<ref id="B9">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Brown</surname> <given-names>A. H. D.</given-names></name></person-group> (<year>1989</year>). <article-title>Core collections: a practical approach to genetic resources management</article-title>. <source>Genome</source> <volume>31</volume>, <fpage>818</fpage>&#x02013;<lpage>824</lpage>. <pub-id pub-id-type="doi">10.1139/g89-144</pub-id></citation></ref>
<ref id="B10">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Campoy</surname> <given-names>J. A.</given-names></name> <name><surname>Lerigoleur-Balsemin</surname> <given-names>E.</given-names></name> <name><surname>Christmann</surname> <given-names>H.</given-names></name> <name><surname>Beauvieux</surname> <given-names>R.</given-names></name> <name><surname>Girollet</surname> <given-names>N.</given-names></name> <name><surname>Quero-Garc&#x000ED;a</surname> <given-names>J.</given-names></name> <etal/></person-group>. (<year>2016</year>). <article-title>Genetic diversity, linkage disequilibrium, population structure and construction of a core collection of <italic>Prunus avium</italic> L. landraces and bred cultivars</article-title>. <source>BMC Plant Biol.</source> <volume>16</volume>:<fpage>49</fpage>. <pub-id pub-id-type="doi">10.1186/s12870-016-0712-9</pub-id><pub-id pub-id-type="pmid">26912051</pub-id></citation></ref>
<ref id="B11">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>J.</given-names></name> <name><surname>Zavala</surname> <given-names>C.</given-names></name> <name><surname>Ortega</surname> <given-names>N.</given-names></name> <name><surname>Petroli</surname> <given-names>C.</given-names></name> <name><surname>Franco</surname> <given-names>J.</given-names></name> <name><surname>Burgue&#x000F1;o</surname> <given-names>J.</given-names></name> <etal/></person-group>. (<year>2016</year>). <article-title>The development of quality control genotyping approaches: a case study using elite maize lines</article-title>. <source>PLoS ONE</source> <volume>11</volume>:<fpage>e0157236</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0157236</pub-id><pub-id pub-id-type="pmid">27280295</pub-id></citation></ref>
<ref id="B12">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>X.</given-names></name> <name><surname>Sullivan</surname> <given-names>P. F.</given-names></name></person-group> (<year>2003</year>). <article-title>Single nucleotide polymorphism genotyping: biochemistry, protocol, cost and throughput</article-title>. <source>Pharmacogenom. J.</source> <volume>3</volume>, <fpage>77</fpage>&#x02013;<lpage>96</lpage>. <pub-id pub-id-type="doi">10.1038/sj.tpj.6500167</pub-id><pub-id pub-id-type="pmid">12746733</pub-id></citation></ref>
<ref id="B13">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chung</surname> <given-names>H. K.</given-names></name> <name><surname>Kim</surname> <given-names>K. W.</given-names></name> <name><surname>Chung</surname> <given-names>J. W.</given-names></name> <name><surname>Lee</surname> <given-names>J. R.</given-names></name> <name><surname>Lee</surname> <given-names>S. Y.</given-names></name> <name><surname>Dixit</surname> <given-names>A.</given-names></name> <etal/></person-group>. (<year>2009</year>). <article-title>Development of a core set from a large rice collection using a modified heuristic algorithm to retain maximum diversity</article-title>. <source>J. Integr. Plant Biol.</source> <volume>51</volume>, <fpage>1116</fpage>&#x02013;<lpage>1125</lpage>. <pub-id pub-id-type="doi">10.1111/j.1744-7909.2009.00882.x</pub-id><pub-id pub-id-type="pmid">20021559</pub-id></citation></ref>
<ref id="B14">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Courtois</surname> <given-names>B.</given-names></name> <name><surname>Audebert</surname> <given-names>A.</given-names></name> <name><surname>Dardou</surname> <given-names>A.</given-names></name> <name><surname>Roques</surname> <given-names>S.</given-names></name> <name><surname>Ghneim-Herrera</surname> <given-names>T.</given-names></name> <name><surname>Droc</surname> <given-names>G.</given-names></name> <etal/></person-group>. (<year>2013</year>). <article-title>Genome-wide association mapping of root traits in a japonica rice panel</article-title>. <source>PLoS ONE</source> <volume>8</volume>:<fpage>e78037</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0078037</pub-id><pub-id pub-id-type="pmid">24223758</pub-id></citation></ref>
<ref id="B15">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Crossa</surname> <given-names>J.</given-names></name> <name><surname>Beyene</surname> <given-names>Y.</given-names></name> <name><surname>Kassa</surname> <given-names>S.</given-names></name> <name><surname>Perez</surname> <given-names>P.</given-names></name> <name><surname>Hickey</surname> <given-names>J. M.</given-names></name> <name><surname>Chen</surname> <given-names>C.</given-names></name> <etal/></person-group>. (<year>2013</year>). <article-title>Genomic prediction in maize breeding populations with genotyping-by-sequencing</article-title>. <source>Genes Genomes Genet.</source> <volume>3</volume>, <fpage>1903</fpage>&#x02013;<lpage>1926</lpage>. <pub-id pub-id-type="doi">10.1534/g3.113.008227</pub-id><pub-id pub-id-type="pmid">24022750</pub-id></citation></ref>
<ref id="B16">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dram&#x000E9;</surname> <given-names>K. N.</given-names></name> <name><surname>Sanchez</surname> <given-names>I.</given-names></name> <name><surname>Gregorio</surname> <given-names>G.</given-names></name> <name><surname>Ndjiondjop</surname> <given-names>M. N.</given-names></name></person-group> (<year>2011</year>). <article-title>Suitability of a selected set of simple sequence repeats (SSR) markers for multiplexing and rapid molecular characterization of African rice (<italic>Oryza glaberrima</italic> Steud.)</article-title>. <source>Afr. J. Biotechnol.</source> <volume>10</volume>, <fpage>6675</fpage>&#x02013;<lpage>6685</lpage>. <pub-id pub-id-type="doi">10.5897/AJB10.2279</pub-id></citation></ref>
<ref id="B17">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dos Santos</surname> <given-names>J. P.</given-names></name> <name><surname>Pires</surname> <given-names>L. P.</given-names></name> <name><surname>de Castro Vasconcellos</surname> <given-names>R. C.</given-names></name> <name><surname>Pereira</surname> <given-names>G. S.</given-names></name> <name><surname>Von Pinho</surname> <given-names>R. G.</given-names></name> <name><surname>Balestre</surname> <given-names>M.</given-names></name></person-group> (<year>2016</year>). <article-title>Genomic selection to resistance to <italic>Stenocarpella</italic> maydis in maize lines using DArTseq markers</article-title>. <source>BMC Genet.</source> <volume>17</volume>:<fpage>86</fpage>. <pub-id pub-id-type="doi">10.1186/s12863-016-0392-3</pub-id><pub-id pub-id-type="pmid">27316946</pub-id></citation></ref>
<ref id="B18">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Egbadzor</surname> <given-names>K. F.</given-names></name> <name><surname>Ofori</surname> <given-names>K.</given-names></name> <name><surname>Yeboah</surname> <given-names>M.</given-names></name> <name><surname>Aboagye</surname> <given-names>L. M.</given-names></name> <name><surname>Opoku-Agyeman</surname> <given-names>M. O.</given-names></name> <name><surname>Danquah</surname> <given-names>E. Y.</given-names></name></person-group> (<year>2014</year>). <article-title>Diversity in 113 cowpea <italic>Vigna</italic> unguiculata (L) walp accessions assessed with 458 SNP markers</article-title>. <source>Springerplus</source> <volume>3</volume>:<fpage>541</fpage>. <pub-id pub-id-type="doi">10.1186/2193-1801-3-541</pub-id><pub-id pub-id-type="pmid">25332852</pub-id></citation></ref>
<ref id="B19">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Egea</surname> <given-names>L. A.</given-names></name> <name><surname>M&#x000E9;rida-Garc&#x000ED;a</surname> <given-names>R.</given-names></name> <name><surname>Kilian</surname> <given-names>A.</given-names></name> <name><surname>Hernandez</surname> <given-names>P.</given-names></name> <name><surname>Dorado</surname> <given-names>G.</given-names></name></person-group> (<year>2017</year>). <article-title>Assessment of genetic diversity and structure of large garlic (<italic>Allium sativum</italic>) germplasm bank, by diversity arrays technology &#x0201C;genotyping-by-sequencing&#x0201D; platform (DArTseq)</article-title>. <source>Front. Genet.</source> <volume>8</volume>:<fpage>98</fpage>. <pub-id pub-id-type="doi">10.3389/fgene.2017.00098</pub-id><pub-id pub-id-type="pmid">28775737</pub-id></citation></ref>
<ref id="B20">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>El Bakkali</surname> <given-names>A.</given-names></name> <name><surname>Haouane</surname> <given-names>H.</given-names></name> <name><surname>Moukhli</surname> <given-names>A.</given-names></name> <name><surname>Costes</surname> <given-names>E.</given-names></name> <name><surname>van Damme</surname> <given-names>P.</given-names></name> <name><surname>Khadari</surname> <given-names>B.</given-names></name></person-group> (<year>2013</year>). <article-title>Construction of core collections suitable for association mapping to optimize use of mediterranean olive (<italic>Olea europaea</italic> l.) genetic resources</article-title>. <source>PLoS ONE</source> <volume>8</volume>:<fpage>e61265</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0061265</pub-id><pub-id pub-id-type="pmid">23667437</pub-id></citation></ref>
<ref id="B21">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Elshire</surname> <given-names>R. J.</given-names></name> <name><surname>Glaubitz</surname> <given-names>J. C.</given-names></name> <name><surname>Sun</surname> <given-names>Q.</given-names></name> <name><surname>Poland</surname> <given-names>J. A.</given-names></name> <name><surname>Kawamoto</surname> <given-names>K.</given-names></name> <name><surname>Buckler</surname> <given-names>E. S.</given-names></name> <etal/></person-group>. (<year>2011</year>). <article-title>A robust, simple genotyping-by-sequencing (GBS) approach for high diversity species</article-title>. <source>PLoS ONE</source> <volume>6</volume>:<fpage>e19379</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0019379</pub-id><pub-id pub-id-type="pmid">21573248</pub-id></citation></ref>
<ref id="B22">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ertiro</surname> <given-names>B. T.</given-names></name> <name><surname>Ogugo</surname> <given-names>V.</given-names></name> <name><surname>Worku</surname> <given-names>M.</given-names></name> <name><surname>Das</surname> <given-names>B.</given-names></name> <name><surname>Olsen</surname> <given-names>M.</given-names></name> <name><surname>Labuschagne</surname> <given-names>M.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>Comparison of kompetitive allele specific PCR (KASP) and genotyping by sequencing (GBS) for quality control analysis in maize</article-title>. <source>BMC Genomics</source> <volume>16</volume>:<fpage>908</fpage>. <pub-id pub-id-type="doi">10.1186/s12864-015-2180-2</pub-id><pub-id pub-id-type="pmid">26545737</pub-id></citation></ref>
<ref id="B23">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Excoffier</surname> <given-names>L.</given-names></name> <name><surname>Lischer</surname> <given-names>H. E.</given-names></name></person-group> (<year>2010</year>). <article-title>Arlequin suite ver 3.5: a new series of programs to perform population genetics analyses under Linux and Windows [electronic resource]</article-title>. <source>Mol. Ecol. Resour.</source> <volume>10</volume>, <fpage>564</fpage>&#x02013;<lpage>567</lpage>. <pub-id pub-id-type="doi">10.1111/j.1755-0998.2010.02847.x</pub-id><pub-id pub-id-type="pmid">21565059</pub-id></citation></ref>
<ref id="B24">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Excoffier</surname> <given-names>L.</given-names></name> <name><surname>Smouse</surname> <given-names>P. E.</given-names></name> <name><surname>Quattro</surname> <given-names>J. M.</given-names></name></person-group> (<year>1992</year>). <article-title>Analysis of molecular variance inferred from metric distances among DNA haplotypes: application to human mitochondrial DNA restriction data</article-title>. <source>Genetics</source> <volume>131</volume>, <fpage>479</fpage>&#x02013;<lpage>491</lpage>. <pub-id pub-id-type="pmid">1644282</pub-id></citation></ref>
<ref id="B25">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Falconer</surname> <given-names>D. S.</given-names></name> <name><surname>MacKay</surname> <given-names>T. F. C.</given-names></name></person-group> (<year>1996</year>). <source>Introduction to Quantitative Genetics</source>. <publisher-name>Longman Group Limited</publisher-name>.</citation></ref>
<ref id="B26">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Frankham</surname> <given-names>R.</given-names></name></person-group> (<year>2005</year>). <article-title>Genetics and extinction</article-title>. <source>Biol. Conserv.</source> <volume>126</volume>, <fpage>131</fpage>&#x02013;<lpage>140</lpage>. <pub-id pub-id-type="doi">10.1016/j.biocon.2005.05.002</pub-id></citation></ref>
<ref id="B27">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Furuta</surname> <given-names>T.</given-names></name> <name><surname>Ashikari</surname> <given-names>M.</given-names></name> <name><surname>Jena</surname> <given-names>K. K.</given-names></name> <name><surname>Doi</surname> <given-names>K.</given-names></name> <name><surname>Reuscher</surname> <given-names>S.</given-names></name></person-group> (<year>2017</year>). <article-title>Adapting genotyping-by-sequencing for rice F2 populations</article-title>. <source>Genes Genomes Genet.</source> <volume>7</volume>, <fpage>881</fpage>&#x02013;<lpage>893</lpage>. <pub-id pub-id-type="doi">10.1534/g3.116.038190</pub-id><pub-id pub-id-type="pmid">28082325</pub-id></citation></ref>
<ref id="B28">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gouesnard</surname> <given-names>B.</given-names></name> <name><surname>Bataillon</surname> <given-names>T. M.</given-names></name> <name><surname>Decoux</surname> <given-names>G.</given-names></name> <name><surname>Rozale</surname> <given-names>C.</given-names></name> <name><surname>Schoen</surname> <given-names>D. J.</given-names></name> <name><surname>David</surname> <given-names>J. L.</given-names></name></person-group> (<year>2001</year>). <article-title>MSTRAT: an algorithm for building germ plasm core collections by maximizing allelic or phenotypic richness</article-title>. <source>J. Heredity</source> <volume>92</volume>, <fpage>93</fpage>&#x02013;<lpage>94</lpage>. <pub-id pub-id-type="doi">10.1093/jhered/92.1.93</pub-id></citation></ref>
<ref id="B29">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Heckenberger</surname> <given-names>M.</given-names></name> <name><surname>Bohn</surname> <given-names>M.</given-names></name> <name><surname>Ziegle</surname> <given-names>J. S.</given-names></name> <name><surname>Joe</surname> <given-names>L. K.</given-names></name> <name><surname>Hauser</surname> <given-names>J. D.</given-names></name> <name><surname>Hutton</surname> <given-names>M.</given-names></name> <etal/></person-group>. (<year>2002</year>). <article-title>Variation of DNA fingerprints among accessions within maize inbred lines and implications for identification of essentially derived varieties. I. Genetic and technical sources of variation in SSR data</article-title>. <source>Mol. Breed.</source> <volume>10</volume>, <fpage>181</fpage>&#x02013;<lpage>191</lpage>. <pub-id pub-id-type="doi">10.1023/A:1020539330957</pub-id></citation></ref>
<ref id="B30">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Holsinger</surname> <given-names>K. E.</given-names></name> <name><surname>Weir</surname> <given-names>B. S.</given-names></name></person-group> (<year>2009</year>). <article-title>Genetics in geographically structured populations: defining, estimating and interpreting FST</article-title>. <source>Nat. Rev. Genet.</source> <volume>10</volume>, <fpage>639</fpage>&#x02013;<lpage>650</lpage>. <pub-id pub-id-type="doi">10.1038/nrg2611</pub-id></citation></ref>
<ref id="B31">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Huang</surname> <given-names>X.</given-names></name> <name><surname>Kurata</surname> <given-names>N.</given-names></name> <name><surname>Wei</surname> <given-names>X.</given-names></name> <name><surname>Wang</surname> <given-names>Z. X.</given-names></name> <name><surname>Wang</surname> <given-names>A.</given-names></name> <name><surname>Zhao</surname> <given-names>Q.</given-names></name> <etal/></person-group>. (<year>2012</year>). <article-title>A map of rice genome variation reveals the origin of cultivated rice</article-title>. <source>Nature</source> <volume>490</volume>, <fpage>497</fpage>&#x02013;<lpage>501</lpage>. <pub-id pub-id-type="doi">10.1038/nature11532</pub-id><pub-id pub-id-type="pmid">23034647</pub-id></citation></ref>
<ref id="B32">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ishii</surname> <given-names>T.</given-names></name> <name><surname>Xu</surname> <given-names>Y.</given-names></name> <name><surname>McCouch</surname> <given-names>S. R.</given-names></name></person-group> (<year>2001</year>). <article-title>Nuclear- and chloroplast-microsatellite variation in a-genome species of rice</article-title>. <source>Genome</source> <volume>44</volume>, <fpage>658</fpage>&#x02013;<lpage>666</lpage>. <pub-id pub-id-type="doi">10.1139/g01-044</pub-id><pub-id pub-id-type="pmid">11550902</pub-id></citation></ref>
<ref id="B33">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jones</surname> <given-names>M. P.</given-names></name> <name><surname>Dingkuhn</surname> <given-names>M.</given-names></name> <name><surname>Aluko/snm</surname> <given-names>G. K.</given-names></name> <name><surname>Semon</surname> <given-names>M.</given-names></name></person-group> (<year>1997</year>). <article-title>Interspecific <italic>Oryza sativa</italic> L. <italic>x O. glaberrima</italic> Steud. progenies in upland rice improvement</article-title>. <source>Euphytica</source> <volume>94</volume>, <fpage>237</fpage>&#x02013;<lpage>246</lpage>. <pub-id pub-id-type="doi">10.1023/A:1002969932224</pub-id></citation></ref>
<ref id="B34">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Joshi</surname> <given-names>S. P.</given-names></name> <name><surname>Gupta</surname> <given-names>V. S.</given-names></name> <name><surname>Aggarwal</surname> <given-names>R. K.</given-names></name> <name><surname>Ranjekar</surname> <given-names>P. K.</given-names></name> <name><surname>Brar</surname> <given-names>D. S.</given-names></name></person-group> (<year>2000</year>). <article-title>Genetic diversity and phylogenetic relationship as revealed by inter simple sequence repeat (ISSR) polymorphism in the genus <italic>Oryza</italic></article-title>. <source>Theor. Appl. Genet.</source> <volume>100</volume>, <fpage>1311</fpage>&#x02013;<lpage>1320</lpage>. <pub-id pub-id-type="doi">10.1007/s001220051440</pub-id></citation></ref>
<ref id="B35">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kilian</surname> <given-names>A.</given-names></name> <name><surname>Sanewski</surname> <given-names>G.</given-names></name> <name><surname>Ko</surname> <given-names>L.</given-names></name></person-group> (<year>2016</year>). <article-title>The application of DArTseq technology to pineapple</article-title>. <source>Acta Hortic.</source> <volume>1111</volume>, <fpage>181</fpage>&#x02013;<lpage>188</lpage>. <pub-id pub-id-type="doi">10.17660/ActaHortic.2016.1111.27</pub-id></citation></ref>
<ref id="B36">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kim</surname> <given-names>K. W.</given-names></name> <name><surname>Chung</surname> <given-names>H. K.</given-names></name> <name><surname>Cho</surname> <given-names>G. T.</given-names></name> <name><surname>Ma</surname> <given-names>K. H.</given-names></name> <name><surname>Chandrabalan</surname> <given-names>D.</given-names></name> <name><surname>Gwag</surname> <given-names>J. G.</given-names></name> <etal/></person-group>. (<year>2007</year>). <article-title>PowerCore: a program applying the advanced M strategy with a heuristic search for establishing core sets</article-title>. <source>Bioinformatics</source> <volume>23</volume>, <fpage>2155</fpage>&#x02013;<lpage>2162</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btm313</pub-id><pub-id pub-id-type="pmid">17586551</pub-id></citation></ref>
<ref id="B37">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kwon</surname> <given-names>S. J.</given-names></name> <name><surname>Lee</surname> <given-names>J. K.</given-names></name> <name><surname>Hong</surname> <given-names>S. W.</given-names></name> <name><surname>Park</surname> <given-names>Y. J.</given-names></name> <name><surname>McNally</surname> <given-names>K. L.</given-names></name> <name><surname>Kim</surname> <given-names>N. S.</given-names></name></person-group> (<year>2006</year>). <article-title>Genetic diversity and phylogenetic relationship in AA <italic>Oryza</italic> species as revealed by Rim2/Hipa CACTA transposon display</article-title>. <source>Genes Genet. Syst.</source> <volume>81</volume>, <fpage>93</fpage>&#x02013;<lpage>101</lpage>. <pub-id pub-id-type="doi">10.1266/ggs.81.93</pub-id><pub-id pub-id-type="pmid">16755133</pub-id></citation></ref>
<ref id="B38">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lam</surname> <given-names>H. M.</given-names></name> <name><surname>Xu</surname> <given-names>X.</given-names></name> <name><surname>Liu</surname> <given-names>X.</given-names></name> <name><surname>Chen</surname> <given-names>W.</given-names></name> <name><surname>Yang</surname> <given-names>G.</given-names></name> <name><surname>Wong</surname> <given-names>F.-L.</given-names></name> <etal/></person-group>. (<year>2010</year>). <article-title>Resequencing of 31 wild and cultivated soybean genomes identifies patterns of genetic diversity and selection</article-title>. <source>Nat. Genet.</source> <volume>42</volume>, <fpage>1053</fpage>&#x02013;<lpage>1059</lpage>. <pub-id pub-id-type="doi">10.1038/ng.715</pub-id><pub-id pub-id-type="pmid">21076406</pub-id></citation></ref>
<ref id="B39">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Leroy</surname> <given-names>T.</given-names></name> <name><surname>De Bellis</surname> <given-names>F.</given-names></name> <name><surname>Legnate</surname> <given-names>H.</given-names></name> <name><surname>Musoli</surname> <given-names>P.</given-names></name> <name><surname>Kalonji</surname> <given-names>A.</given-names></name> <name><surname>Loor Sol&#x000F3;rzano</surname> <given-names>R. G.</given-names></name> <etal/></person-group>. (<year>2014</year>). <article-title>Developing core collections to optimize the management and the exploitation of diversity of the coffee <italic>Coffea</italic> canephora</article-title>. <source>Genetica</source> <volume>142</volume>, <fpage>185</fpage>&#x02013;<lpage>199</lpage>. <pub-id pub-id-type="doi">10.1007/s10709-014-9766-5</pub-id><pub-id pub-id-type="pmid">24792040</pub-id></citation></ref>
<ref id="B40">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>Z. M.</given-names></name> <name><surname>Zheng</surname> <given-names>X. M.</given-names></name> <name><surname>Ge</surname> <given-names>S.</given-names></name></person-group> (<year>2011</year>). <article-title>Genetic diversity and domestication history of African rice (<italic>Oryza glaberrima</italic>) as inferred from multiple gene sequences</article-title>. <source>Theor. Appl. Genet.</source> <volume>123</volume>, <fpage>21</fpage>&#x02013;<lpage>31</lpage>. <pub-id pub-id-type="doi">10.1007/s00122-011-1563-2</pub-id><pub-id pub-id-type="pmid">21400109</pub-id></citation></ref>
<ref id="B41">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname> <given-names>K.</given-names></name> <name><surname>Muse</surname> <given-names>S. V.</given-names></name></person-group> (<year>2005</year>). <article-title>PowerMarker: an integrated analysis environment for genetic marker analysis</article-title>. <source>Bioinformatics</source> <volume>21</volume>, <fpage>2128</fpage>&#x02013;<lpage>2129</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/bti282</pub-id><pub-id pub-id-type="pmid">15705655</pub-id></citation></ref>
<ref id="B42">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname> <given-names>W.</given-names></name> <name><surname>Shahid</surname> <given-names>M. Q.</given-names></name> <name><surname>Bai</surname> <given-names>L.</given-names></name> <name><surname>Lu</surname> <given-names>Z.</given-names></name> <name><surname>Chen</surname> <given-names>Y.</given-names></name> <name><surname>Jiang</surname> <given-names>L.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>Evaluation of genetic diversity and development of a core collection of wild rice (<italic>Oryza rufipogon</italic> Griff.) populations in China</article-title>. <source>PLoS ONE</source> <volume>10</volume>:<fpage>e0145990</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0145990</pub-id><pub-id pub-id-type="pmid">26720755</pub-id></citation></ref>
<ref id="B43">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Luan</surname> <given-names>S.</given-names></name> <name><surname>Chiang</surname> <given-names>T. Y.</given-names></name> <name><surname>Gong</surname> <given-names>X. U. N.</given-names></name></person-group> (<year>2006</year>). <article-title>High genetic diversity vs. low genetic differentiation in nouelia insignis (Asteraceae), a narrowly distributed and endemic species in China, revealed by ISSR fingerprinting</article-title>. <source>Ann. Bot.</source> <volume>98</volume>, <fpage>583</fpage>&#x02013;<lpage>589</lpage>. <pub-id pub-id-type="doi">10.1093/aob/mcl129</pub-id><pub-id pub-id-type="pmid">16807255</pub-id></citation></ref>
<ref id="B44">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Maclean</surname> <given-names>J. L.</given-names></name> <name><surname>Dawe</surname> <given-names>D. C.</given-names></name> <name><surname>Hardy</surname> <given-names>B.</given-names></name> <name><surname>Hettel</surname> <given-names>G. P.</given-names></name></person-group> (<year>2002</year>). <source>Rice Almanac</source>. <publisher-loc>Los Banos, CA</publisher-loc>: <publisher-name>CABI Publishing</publisher-name>.</citation></ref>
<ref id="B45">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>McCouch</surname> <given-names>S. R.</given-names></name> <name><surname>McNally</surname> <given-names>K. L.</given-names></name> <name><surname>Wang</surname> <given-names>W.</given-names></name> <name><surname>Sackville Hamilton</surname> <given-names>R.</given-names></name></person-group> (<year>2012</year>). <article-title>Genomics of genebanks: a case study in rice</article-title>. <source>Am. J. Bot.</source> <volume>99</volume>, <fpage>407</fpage>&#x02013;<lpage>423</lpage>. <pub-id pub-id-type="doi">10.3732/ajb.1100385</pub-id></citation></ref>
<ref id="B46">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Meirmans</surname> <given-names>P. G.</given-names></name></person-group> (<year>2012</year>). <article-title>AMOVA-based clustering of population genetic data</article-title>. <source>J. Hered.</source> <volume>103</volume>, <fpage>744</fpage>&#x02013;<lpage>750</lpage>. <pub-id pub-id-type="doi">10.1093/jhered/ess047</pub-id><pub-id pub-id-type="pmid">22896561</pub-id></citation></ref>
<ref id="B47">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Meyer</surname> <given-names>R. S.</given-names></name> <name><surname>Choi</surname> <given-names>J. Y.</given-names></name> <name><surname>Sanches</surname> <given-names>M.</given-names></name> <name><surname>Plessis</surname> <given-names>A.</given-names></name> <name><surname>Flowers</surname> <given-names>J. M.</given-names></name> <name><surname>Amas</surname> <given-names>J.</given-names></name> <etal/></person-group>. (<year>2016</year>). <article-title>Domestication history and geographical adaptation inferred from a SNP map of African rice</article-title>. <source>Nat. Genet.</source> <volume>48</volume>, <fpage>1083</fpage>&#x02013;<lpage>1088</lpage>. <pub-id pub-id-type="doi">10.1038/ng.3633</pub-id><pub-id pub-id-type="pmid">27500524</pub-id></citation></ref>
<ref id="B48">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mokuwa</surname> <given-names>A.</given-names></name> <name><surname>Nuijten</surname> <given-names>E.</given-names></name> <name><surname>Okry</surname> <given-names>F.</given-names></name> <name><surname>Teeken</surname> <given-names>B.</given-names></name> <name><surname>Maat</surname> <given-names>H.</given-names></name> <name><surname>Richards</surname> <given-names>P.</given-names></name> <etal/></person-group>. (<year>2014</year>). <article-title>Processes underpinning development and maintenance of diversity in rice in West Africa: evidence from combining morphological and molecular markers</article-title>. <source>PLoS ONE</source> <volume>9</volume>:<fpage>e85953</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0085953</pub-id><pub-id pub-id-type="pmid">24465809</pub-id></citation></ref>
<ref id="B49">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Montcho</surname> <given-names>D.</given-names></name> <name><surname>Futakuchi</surname> <given-names>K.</given-names></name> <name><surname>Agbangla</surname> <given-names>C.</given-names></name> <name><surname>Semon</surname> <given-names>M.</given-names></name> <name><surname>Dieng</surname> <given-names>I.</given-names></name> <name><surname>Sie</surname> <given-names>M.</given-names></name></person-group> (<year>2013</year>). <article-title>Morphological and phenological response of African rice (<italic>Oryza glaberrima</italic> steud.) under different hydrological conditions</article-title>. <source>Asian J. Plant Sci.</source> <volume>12</volume>, <fpage>79</fpage>&#x02013;<lpage>86</lpage>. <pub-id pub-id-type="doi">10.3923/ajps.2013.79.86</pub-id></citation></ref>
<ref id="B50">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Munoz-Amatriain</surname> <given-names>M.</given-names></name> <name><surname>Cuesta-Marcos</surname> <given-names>A.</given-names></name> <name><surname>Endelman</surname> <given-names>J. B.</given-names></name> <name><surname>Comadran</surname> <given-names>J.</given-names></name> <name><surname>Bonman</surname> <given-names>J. M.</given-names></name> <name><surname>Bockelman</surname> <given-names>H. E.</given-names></name> <etal/></person-group>. (<year>2014</year>). <article-title>The USDA barley core collection: genetic diversity, population structure, and potential for genome-wide association studies</article-title>. <source>PLoS ONE</source> <volume>9</volume>:<fpage>e94688</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0094688</pub-id><pub-id pub-id-type="pmid">24732668</pub-id></citation></ref>
<ref id="B51">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Murray</surname> <given-names>M. G.</given-names></name> <name><surname>Thompson</surname> <given-names>W. F.</given-names></name></person-group> (<year>1980</year>). <article-title>Rapid isolation of high molecular weight plant DNA</article-title>. <source>Nucleic Acids Res</source> <volume>8</volume>, <fpage>4321</fpage>&#x02013;<lpage>4325</lpage>. <pub-id pub-id-type="doi">10.1093/nar/8.19.4321</pub-id><pub-id pub-id-type="pmid">7433111</pub-id></citation></ref>
<ref id="B52">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nazzicari</surname> <given-names>N.</given-names></name> <name><surname>Biscarini</surname> <given-names>F.</given-names></name> <name><surname>Cozzi</surname> <given-names>P.</given-names></name> <name><surname>Brummer</surname> <given-names>E. C.</given-names></name> <name><surname>Annicchiarico</surname> <given-names>P.</given-names></name></person-group> (<year>2016</year>). <article-title>Marker imputation efficiency for genotyping-by-sequencing data in rice (<italic>Oryza sativa</italic>) and alfalfa (<italic>Medicago sativa</italic>)</article-title>. <source>Mol. Breed</source>. <volume>36</volume>, <fpage>69</fpage>. <pub-id pub-id-type="doi">10.1007/s11032-016-0490-y</pub-id></citation></ref>
<ref id="B53">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Noirot</surname> <given-names>M.</given-names></name> <name><surname>Hamon</surname> <given-names>S.</given-names></name> <name><surname>Anthony</surname> <given-names>F.</given-names></name></person-group> (<year>1996</year>). <article-title>The principal component scoring: a new method of constituting a core collection using quantitative data</article-title>. <source>Genet. Resour. Crop. Evol.</source> <volume>43</volume>, <fpage>1</fpage>&#x02013;<lpage>6</lpage>. <pub-id pub-id-type="doi">10.1007/BF00126934</pub-id></citation></ref>
<ref id="B54">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Odong</surname> <given-names>T. L.</given-names></name> <name><surname>Jansen</surname> <given-names>J.</given-names></name> <name><surname>van Eeuwijk</surname> <given-names>F. A.</given-names></name> <name><surname>van Hintum</surname> <given-names>T. J. L.</given-names></name></person-group> (<year>2013</year>). <article-title>Quality of core collections for effective utilisation of genetic resources review, discussion and interpretation</article-title>. <source>Theor. Appl. Genet.</source> <volume>126</volume>, <fpage>289</fpage>&#x02013;<lpage>305</lpage>. <pub-id pub-id-type="doi">10.1007/s00122-012-1971-y</pub-id><pub-id pub-id-type="pmid">22983567</pub-id></citation></ref>
<ref id="B55">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Orjuela</surname> <given-names>J.</given-names></name> <name><surname>Sabot</surname> <given-names>F.</given-names></name> <name><surname>Ch&#x000E9;ron</surname> <given-names>S.</given-names></name> <name><surname>Vigouroux</surname> <given-names>Y.</given-names></name> <name><surname>Adam</surname> <given-names>H.</given-names></name> <name><surname>Chrestin</surname> <given-names>H.</given-names></name> <etal/></person-group>. (<year>2014</year>). <article-title>An extensive analysis of the African rice genetic diversity through a global genotyping</article-title>. <source>Theor. Appl. Genet.</source> <volume>127</volume>, <fpage>2211</fpage>&#x02013;<lpage>2223</lpage>. <pub-id pub-id-type="doi">10.1007/s00122-014-2374-z</pub-id><pub-id pub-id-type="pmid">25119871</pub-id></citation></ref>
<ref id="B56">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ouborg</surname> <given-names>N. J.</given-names></name> <name><surname>Piquot</surname> <given-names>Y.</given-names></name> <name><surname>Groenendael</surname> <given-names>J. M.</given-names></name></person-group> (<year>1999</year>). <article-title>Population genetics, molecular markers and the study of dispersal in plants</article-title>. <source>J. Ecol.</source> <volume>87</volume>, <fpage>551</fpage>&#x02013;<lpage>568</lpage>. <pub-id pub-id-type="doi">10.1046/j.1365-2745.1999.00389.x</pub-id></citation></ref>
<ref id="B57">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Park</surname> <given-names>K. C.</given-names></name> <name><surname>Kim</surname> <given-names>N. H.</given-names></name> <name><surname>Cho</surname> <given-names>Y. S.</given-names></name> <name><surname>Kang</surname> <given-names>K. H.</given-names></name> <name><surname>Lee</surname> <given-names>J. K.</given-names></name> <name><surname>Kim</surname> <given-names>N. S.</given-names></name></person-group> (<year>2003</year>). <article-title>Genetic variations of AA genome <italic>Oryza</italic> species measured by MITE-AFLP</article-title>. <source>Theor. Appl. Genet.</source> <volume>107</volume>, <fpage>203</fpage>&#x02013;<lpage>209</lpage>. <pub-id pub-id-type="doi">10.1007/s00122-003-1252-x</pub-id><pub-id pub-id-type="pmid">12845436</pub-id></citation></ref>
<ref id="B58">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Perrier</surname> <given-names>X.</given-names></name> <name><surname>Flori</surname> <given-names>A.</given-names></name> <name><surname>Bonnot</surname> <given-names>F.</given-names></name></person-group> (<year>2003</year>). <article-title>Data analysis methods</article-title>, in <source>Genetic Diversity of Cultivated Tropical Plants</source>, eds <person-group person-group-type="author"><name><surname>Hamon</surname> <given-names>P.</given-names></name> <name><surname>Seguin</surname> <given-names>M.</given-names></name> <name><surname>Perrier</surname> <given-names>X.</given-names></name> <name><surname>Glaszmann</surname> <given-names>J. C. E.</given-names></name></person-group> (<publisher-loc>Montpellier</publisher-loc>: <publisher-name>Enfield Science Publishers</publisher-name>), <fpage>43</fpage>&#x02013;<lpage>76</lpage>.</citation></ref>
<ref id="B59">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pessoa-Filho</surname> <given-names>M.</given-names></name> <name><surname>Rangel</surname> <given-names>P. H. N.</given-names></name> <name><surname>Ferreira</surname> <given-names>M. E.</given-names></name></person-group> (<year>2010</year>). <article-title>Extracting samples of high diversity from thematic collections of large genebanks using a genetic-distance based approach</article-title>. <source>BMC Plant Biol.</source> <volume>10</volume>:<fpage>127</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2229-10-127</pub-id></citation></ref>
<ref id="B60">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pritchard</surname> <given-names>J. K.</given-names></name> <name><surname>Stephens</surname> <given-names>M.</given-names></name> <name><surname>Donnelly</surname> <given-names>P.</given-names></name></person-group> (<year>2000</year>). <article-title>Inference of population structure using multilocus genotype data</article-title>. <source>Genetics</source> <volume>155</volume>, <fpage>945</fpage>&#x02013;<lpage>959</lpage>. <pub-id pub-id-type="pmid">10835412</pub-id></citation></ref>
<ref id="B61">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rafalski</surname> <given-names>A.</given-names></name></person-group> (<year>2002</year>). <article-title>Applications of single nucleotide polymorphisms in crop genetics</article-title>. <source>Curr. Opin. Plant Biol.</source> <volume>5</volume>, <fpage>94</fpage>&#x02013;<lpage>100</lpage>. <pub-id pub-id-type="doi">10.1016/S1369-5266(02)00240-6</pub-id><pub-id pub-id-type="pmid">11856602</pub-id></citation></ref>
<ref id="B62">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Reif</surname> <given-names>J. C.</given-names></name> <name><surname>Zhang</surname> <given-names>P.</given-names></name> <name><surname>Dreisigacker</surname> <given-names>S.</given-names></name> <name><surname>Warburton</surname> <given-names>M. L.</given-names></name> <name><surname>van Ginkel</surname> <given-names>M.</given-names></name> <name><surname>Hoisington</surname> <given-names>D.</given-names></name> <etal/></person-group>. (<year>2005</year>). <article-title>Wheat genetic diversity trends during domestication and breeding</article-title>. <source>Theor. Appl. Genet.</source> <volume>110</volume>, <fpage>859</fpage>&#x02013;<lpage>864</lpage>. <pub-id pub-id-type="doi">10.1007/s00122-004-1881-8</pub-id><pub-id pub-id-type="pmid">15690175</pub-id></citation></ref>
<ref id="B63">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ren</surname> <given-names>R.</given-names></name> <name><surname>Ray</surname> <given-names>R.</given-names></name> <name><surname>Li</surname> <given-names>P.</given-names></name> <name><surname>Xu</surname> <given-names>J.</given-names></name> <name><surname>Zhang</surname> <given-names>M.</given-names></name> <name><surname>Liu</surname> <given-names>G.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>Construction of a high-density DArTseq SNP-based genetic map and identification of genomic regions with segregation distortion in a genetic population derived from a cross between feral and cultivated-type watermelon</article-title>. <source>Mol. Genet. Genomics</source> <volume>290</volume>, <fpage>1457</fpage>&#x02013;<lpage>1470</lpage>. <pub-id pub-id-type="doi">10.1007/s00438-015-0997-7</pub-id><pub-id pub-id-type="pmid">25702268</pub-id></citation></ref>
<ref id="B64">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Roy</surname> <given-names>S. K. S.</given-names></name> <name><surname>Hamid</surname> <given-names>A.</given-names></name> <name><surname>Miah</surname> <given-names>M. G.</given-names></name> <name><surname>Hashem</surname> <given-names>A.</given-names></name></person-group> (<year>1996</year>). <article-title>Seed size variation and its effects on germination and seedling vigour in rice</article-title>. <source>J. Agron. Crop. Sci.</source> <volume>176</volume>, <fpage>79</fpage>&#x02013;<lpage>82</lpage>. <pub-id pub-id-type="doi">10.1111/j.1439-037X.1996.tb00449.x</pub-id></citation></ref>
<ref id="B65">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sansaloni</surname> <given-names>C.</given-names></name> <name><surname>Petroli</surname> <given-names>C.</given-names></name> <name><surname>Jaccoud</surname> <given-names>D.</given-names></name> <name><surname>Carling</surname> <given-names>J.</given-names></name> <name><surname>Detering</surname> <given-names>F.</given-names></name> <name><surname>Grattapaglia</surname> <given-names>D.</given-names></name> <etal/></person-group>. (<year>2011</year>). <article-title>Diversity Arrays Technology (DArT) and next-generation sequencing combined: genome-wide, high throughput, highly informative genotyping for molecular breeding of <italic>Eucalyptus</italic></article-title>. <source>BMC Proc.</source> <volume>5</volume>:<fpage>P54</fpage>. <pub-id pub-id-type="doi">10.1186/1753-6561-5-S7-P54</pub-id></citation></ref>
<ref id="B66">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Schlotterer</surname> <given-names>C.</given-names></name></person-group> (<year>2004</year>). <article-title>The evolution of molecular markers - just a matter of fashion?</article-title> <source>Nat. Rev. Genet.</source> <volume>5</volume>, <fpage>63</fpage>&#x02013;<lpage>69</lpage>. <pub-id pub-id-type="doi">10.1038/nrg1249</pub-id><pub-id pub-id-type="pmid">14666112</pub-id></citation></ref>
<ref id="B67">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Semagn</surname> <given-names>K.</given-names></name> <name><surname>Beyene</surname> <given-names>Y.</given-names></name> <name><surname>Makumbi</surname> <given-names>D.</given-names></name> <name><surname>Mugo</surname> <given-names>S.</given-names></name> <name><surname>Prasanna</surname> <given-names>B. M.</given-names></name> <name><surname>Magorokosho</surname> <given-names>C.</given-names></name> <etal/></person-group>. (<year>2012a</year>). <article-title>Quality control genotyping for assessment of genetic identity and purity in diverse tropical maize inbred lines</article-title>. <source>Theor. Appl. Genet.</source> <volume>125</volume>, <fpage>1487</fpage>&#x02013;<lpage>1501</lpage>. <pub-id pub-id-type="doi">10.1007/s00122-012-1928-1</pub-id><pub-id pub-id-type="pmid">22801872</pub-id></citation></ref>
<ref id="B68">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Semagn</surname> <given-names>K.</given-names></name> <name><surname>Beyene</surname> <given-names>Y.</given-names></name> <name><surname>Raman</surname> <given-names>B.</given-names></name> <name><surname>Sudha</surname> <given-names>N.</given-names></name> <name><surname>Gowda</surname> <given-names>M.</given-names></name> <name><surname>Biswanath</surname> <given-names>D.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>Quantitative trait loci mapping and molecular breeding for developing stress resilient maize for sub-Saharan Africa</article-title>. <source>Crop Sci.</source> <volume>55</volume>, <fpage>1449</fpage>&#x02013;<lpage>1459</lpage>. <pub-id pub-id-type="doi">10.2135/cropsci2014.09.0646</pub-id></citation></ref>
<ref id="B69">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Semagn</surname> <given-names>K.</given-names></name> <name><surname>Bjornstad</surname> <given-names>A.</given-names></name> <name><surname>Ndjiondjop</surname> <given-names>M. N.</given-names></name></person-group> (<year>2006</year>). <article-title>An overview of molecular marker methods for plants</article-title>. <source>Afr. J. Biotechnol.</source> <volume>5</volume>, <fpage>2540</fpage>&#x02013;<lpage>2568</lpage>.</citation></ref>
<ref id="B70">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Semagn</surname> <given-names>K.</given-names></name> <name><surname>Magorokosho</surname> <given-names>C.</given-names></name> <name><surname>Ogugo</surname> <given-names>V.</given-names></name> <name><surname>Makumbi</surname> <given-names>D.</given-names></name> <name><surname>Warburton</surname> <given-names>M.</given-names></name></person-group> (<year>2014</year>). <article-title>Genetic relationships and structure among open-pollinated maize varieties adapted to eastern and southern Africa using microsatellite markers</article-title>. <source>Mol. Breed.</source> <volume>34</volume>, <fpage>1423</fpage>&#x02013;<lpage>1435</lpage>. <pub-id pub-id-type="doi">10.1007/s11032-014-0126-z</pub-id></citation></ref>
<ref id="B71">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Semagn</surname> <given-names>K.</given-names></name> <name><surname>Magorokosho</surname> <given-names>C.</given-names></name> <name><surname>Vivek</surname> <given-names>B. S.</given-names></name> <name><surname>Makumbi</surname> <given-names>D.</given-names></name> <name><surname>Beyene</surname> <given-names>Y.</given-names></name> <name><surname>Mugo</surname> <given-names>S.</given-names></name> <etal/></person-group>. (<year>2012b</year>). <article-title>Molecular characterization of diverse CIMMYT maize inbred lines from eastern and southern Africa using single nucleotide polymorphic markers</article-title>. <source>BMC Genomics</source> <volume>13</volume>:<fpage>113</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2164-13-113</pub-id><pub-id pub-id-type="pmid">22443094</pub-id></citation></ref>
<ref id="B72">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Semon</surname> <given-names>M.</given-names></name> <name><surname>Nielsen</surname> <given-names>R.</given-names></name> <name><surname>Jones</surname> <given-names>M. P.</given-names></name> <name><surname>McCouch</surname> <given-names>S. R.</given-names></name></person-group> (<year>2005</year>). <article-title>The population structure of African cultivated rice <italic>Oryza glaberrima</italic> (Steud.): evidence for elevated levels of linkage disequilibrium caused by admixture with <italic>O. sativa</italic> and ecological adaptation</article-title>. <source>Genetics</source> <volume>169</volume>, <fpage>1639</fpage>&#x02013;<lpage>1647</lpage>. <pub-id pub-id-type="doi">10.1534/genetics.104.033175</pub-id><pub-id pub-id-type="pmid">15545652</pub-id></citation></ref>
<ref id="B73">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sharma</surname> <given-names>P. K.</given-names></name></person-group> (<year>2017</year>). <article-title>Molecular markers: mini review</article-title>. <source>Plant Cell Biotechnol. Mol. Biol.</source> <volume>18</volume>, <fpage>181</fpage>&#x02013;<lpage>189</lpage>.</citation></ref>
<ref id="B74">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Swarts</surname> <given-names>K.</given-names></name> <name><surname>Li</surname> <given-names>H.</given-names></name> <name><surname>Alberto Romero Navarro</surname> <given-names>J.</given-names></name> <name><surname>An</surname> <given-names>D.</given-names></name> <name><surname>Romay</surname> <given-names>M. C.</given-names></name> <name><surname>Hearne</surname> <given-names>S.</given-names></name></person-group> (<year>2014</year>). <article-title>Novel methods to optimize genotypic imputation for low-coverage, next-generation sequence data in crop plants</article-title>. <source>Plant Genome</source> <volume>7</volume>, <fpage>1</fpage>&#x02013;<lpage>12</lpage>. <pub-id pub-id-type="doi">10.3835/plantgenome2014.05.0023</pub-id></citation></ref>
<ref id="B75">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Syvanen</surname> <given-names>A. C.</given-names></name></person-group> (<year>2001</year>). <article-title>Accessing genetic variation: genotyping single nucleotide polymorphisms</article-title>. <source>Nat. Rev. Genet.</source> <volume>2</volume>, <fpage>930</fpage>&#x02013;<lpage>942</lpage>. <pub-id pub-id-type="doi">10.1038/35103535</pub-id><pub-id pub-id-type="pmid">11733746</pub-id></citation></ref>
<ref id="B76">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tamura</surname> <given-names>K.</given-names></name> <name><surname>Stecher</surname> <given-names>G.</given-names></name> <name><surname>Peterson</surname> <given-names>D.</given-names></name> <name><surname>Filipski</surname> <given-names>A.</given-names></name> <name><surname>Kumar</surname> <given-names>S.</given-names></name></person-group> (<year>2013</year>). <article-title>MEGA6: molecular evolutionary genetics analysis version 6.0</article-title>. <source>Mol. Biol. Evol.</source> <volume>30</volume>, <fpage>2725</fpage>&#x02013;<lpage>2729</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/mst197</pub-id><pub-id pub-id-type="pmid">24132122</pub-id></citation></ref>
<ref id="B77">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Thachuk</surname> <given-names>C.</given-names></name> <name><surname>Crossa</surname> <given-names>J.</given-names></name> <name><surname>Franco</surname> <given-names>J.</given-names></name> <name><surname>Dreisigacker</surname> <given-names>S.</given-names></name> <name><surname>Warburton</surname> <given-names>M.</given-names></name> <name><surname>Davenport</surname> <given-names>G. F.</given-names></name></person-group> (<year>2009</year>). <article-title>Core Hunter: an algorithm for sampling genetic resources based on multiple genetic measures</article-title>. <source>BMC Bioinform.</source> <volume>10</volume>:<fpage>243</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2105-10-243</pub-id><pub-id pub-id-type="pmid">19660135</pub-id></citation></ref>
<ref id="B78">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tiwari</surname> <given-names>K. K.</given-names></name> <name><surname>Singh</surname> <given-names>A.</given-names></name> <name><surname>Pattnaik</surname> <given-names>S.</given-names></name> <name><surname>Sandhu</surname> <given-names>M.</given-names></name> <name><surname>Kaur</surname> <given-names>S.</given-names></name> <name><surname>Jain</surname> <given-names>S.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>Identification of a diverse mini-core panel of Indian rice germplasm based on genotyping using microsatellite markers</article-title>. <source>Plant Breed.</source> <volume>134</volume>, <fpage>164</fpage>&#x02013;<lpage>171</lpage>. <pub-id pub-id-type="doi">10.1111/pbr.12252</pub-id></citation></ref>
<ref id="B79">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Van Hintum</surname> <given-names>T. J. L.</given-names></name> <name><surname>Brown</surname> <given-names>A. H. D.</given-names></name> <name><surname>Spillane</surname> <given-names>C.</given-names></name> <name><surname>Hodgkin</surname> <given-names>T.</given-names></name></person-group> (<year>2000</year>). <article-title>Core collections of plant genetic resources</article-title>. <source>IPGRI Tech. Bull.</source> <volume>3</volume>, <fpage>1</fpage>&#x02013;<lpage>48</lpage>.</citation></ref>
<ref id="B80">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>M.</given-names></name> <name><surname>Yu</surname> <given-names>Y.</given-names></name> <name><surname>Haberer</surname> <given-names>G.</given-names></name> <name><surname>Marri</surname> <given-names>P. R.</given-names></name> <name><surname>Fan</surname> <given-names>C.</given-names></name> <name><surname>Goicoechea</surname> <given-names>J. L.</given-names></name> <etal/></person-group>. (<year>2014</year>). <article-title>The genome sequence of African rice (<italic>Oryza glaberrima</italic>) and evidence for independent domestication</article-title>. <source>Nat. Genet.</source> <volume>46</volume>, <fpage>982</fpage>&#x02013;<lpage>988</lpage>. <pub-id pub-id-type="doi">10.1038/ng.3044</pub-id><pub-id pub-id-type="pmid">25064006</pub-id></citation></ref>
<ref id="B81">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Warburton</surname> <given-names>M. L.</given-names></name> <name><surname>Setimela</surname> <given-names>P.</given-names></name> <name><surname>Franco</surname> <given-names>J.</given-names></name> <name><surname>Cordova</surname> <given-names>H.</given-names></name> <name><surname>Pixley</surname> <given-names>K.</given-names></name> <name><surname>Banziger</surname> <given-names>M.</given-names></name> <etal/></person-group>. (<year>2010</year>). <article-title>Toward a cost-effective fingerprinting methodology to distinguish maize open-pollinated varieties</article-title>. <source>Crop Sci</source>. <volume>50</volume>, <fpage>467</fpage>&#x02013;<lpage>477</lpage>. <pub-id pub-id-type="doi">10.2135/cropsci2009.02.0089</pub-id></citation></ref>
<ref id="B82">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wright</surname> <given-names>S.</given-names></name></person-group> (<year>1943</year>). <article-title>Isolation by distance</article-title>. <source>Genetics</source> <volume>28</volume>, <fpage>39</fpage>&#x02013;<lpage>156</lpage>. <pub-id pub-id-type="pmid">17247074</pub-id></citation></ref>
<ref id="B83">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Wright</surname> <given-names>S.</given-names></name></person-group> (<year>1978</year>). <source>Evolution and the Genetics of Populations: Variability within and Among Natural Populations</source>. <publisher-loc>Chicago, IL</publisher-loc>: <publisher-name>University of Chicago Press</publisher-name>.</citation></ref>
<ref id="B84">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wright</surname> <given-names>S. I.</given-names></name> <name><surname>Bi</surname> <given-names>I. V.</given-names></name> <name><surname>Schroeder</surname> <given-names>S. G.</given-names></name> <name><surname>Yamasaki</surname> <given-names>M.</given-names></name> <name><surname>Doebley</surname> <given-names>J. F.</given-names></name> <name><surname>McMullen</surname> <given-names>M. D.</given-names></name> <etal/></person-group>. (<year>2005</year>). <article-title>The effects of artificial selection on the maize genome</article-title>. <source>Science</source> <volume>308</volume>, <fpage>1310</fpage>&#x02013;<lpage>1314</lpage>. <pub-id pub-id-type="doi">10.1126/science.1107891</pub-id><pub-id pub-id-type="pmid">15919994</pub-id></citation></ref>
<ref id="B85">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yan</surname> <given-names>W.</given-names></name> <name><surname>Rutger</surname> <given-names>J. N.</given-names></name> <name><surname>Bryant</surname> <given-names>R. J.</given-names></name> <name><surname>Bockelman</surname> <given-names>H. E.</given-names></name> <name><surname>Fjellstrom</surname> <given-names>R. G.</given-names></name> <name><surname>Ming-Hsuan</surname> <given-names>C.</given-names></name> <etal/></person-group>. (<year>2007</year>). <article-title>Development and evaluation of a core subset of the USDA rice germplasm collection</article-title>. <source>Crop Sci.</source> <volume>47</volume>, <fpage>869</fpage>&#x02013;<lpage>878</lpage>. <pub-id pub-id-type="doi">10.2135/cropsci2006.07.0444</pub-id></citation></ref>
<ref id="B86">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname> <given-names>X.</given-names></name> <name><surname>Gao</surname> <given-names>S.</given-names></name> <name><surname>Xu</surname> <given-names>S.</given-names></name> <name><surname>Zhang</surname> <given-names>Z.</given-names></name> <name><surname>Prasanna</surname> <given-names>B.</given-names></name> <name><surname>Li</surname> <given-names>L.</given-names></name> <etal/></person-group>. (<year>2011</year>). <article-title>Characterization of a global germplasm collection and its potential utilization for analysis of complex quantitative traits in maize</article-title>. <source>Mol. Breed.</source> <volume>28</volume>, <fpage>511</fpage>&#x02013;<lpage>526</lpage>. <pub-id pub-id-type="doi">10.1007/s11032-010-9500-7</pub-id></citation></ref>
<ref id="B87">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname> <given-names>X.</given-names></name> <name><surname>Ren</surname> <given-names>R.</given-names></name> <name><surname>Ray</surname> <given-names>R.</given-names></name> <name><surname>Xu</surname> <given-names>J.</given-names></name> <name><surname>Li</surname> <given-names>P.</given-names></name> <name><surname>Zhang</surname> <given-names>M.</given-names></name> <etal/></person-group>. (<year>2016</year>). <article-title>Genetic diversity and population structure of core watermelon (<italic>Citrullus lanatus</italic>) genotypes using DArTseq-based SNPs</article-title>. <source>Plant Genet Res</source>. <volume>14</volume>, <fpage>226</fpage>&#x02013;<lpage>233</lpage>. <pub-id pub-id-type="doi">10.1017/S1479262115000659</pub-id></citation></ref>
<ref id="B88">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhao</surname> <given-names>W.</given-names></name> <name><surname>Cho</surname> <given-names>G.-T.</given-names></name> <name><surname>Ma</surname> <given-names>K.-H.</given-names></name> <name><surname>Chung</surname> <given-names>J.-W.</given-names></name> <name><surname>Gwag</surname> <given-names>J.-G.</given-names></name> <name><surname>Park</surname> <given-names>Y.-J.</given-names></name></person-group> (<year>2010</year>). <article-title>Development of an allele-mining set in rice using a heuristic algorithm and SSR genotype data with least redundancy for the post-genomic era</article-title>. <source>Mol. Breed.</source> <volume>26</volume>, <fpage>639</fpage>&#x02013;<lpage>651</lpage>. <pub-id pub-id-type="doi">10.1007/s11032-010-9400-x</pub-id></citation></ref>
</ref-list> 
</back>
</article>
