<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Plant Sci.</journal-id>
<journal-title>Frontiers in Plant Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Plant Sci.</abbrev-journal-title>
<issn pub-type="epub">1664-462X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpls.2021.775051</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Plant Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>High-Quality Genomes and High-Density Genetic Map Facilitate the Identification of Genes From a Weedy Rice</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Li</surname> <given-names>Fei</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn002"><sup>&#x2020;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1476457/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Han</surname> <given-names>Zhenyun</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn002"><sup>&#x2020;</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Qiao</surname> <given-names>Weihua</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/488859/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Wang</surname> <given-names>Junrui</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/998634/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Song</surname> <given-names>Yue</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Cui</surname> <given-names>Yongxia</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Li</surname> <given-names>Jiaqi</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Ge</surname> <given-names>Jinyue</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Lou</surname> <given-names>Danjing</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Fan</surname> <given-names>Weiya</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Li</surname> <given-names>Danting</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Nong</surname> <given-names>Baoxuan</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Zhang</surname> <given-names>Zongqiong</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Cheng</surname> <given-names>Yunlian</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Zhang</surname> <given-names>Lifang</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Zheng</surname> <given-names>Xiaoming</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/829734/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Yang</surname> <given-names>Qingwen</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c002"><sup>&#x002A;</sup></xref>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>National Key Facility for Crop Gene Resources and Genetic Improvement, Institute of Crop Sciences, Chinese Academy of Agricultural Sciences</institution>, <addr-line>Beijing</addr-line>, <country>China</country></aff>
<aff id="aff2"><sup>2</sup><institution>Guangxi Key Laboratory for Polysaccharide Materials and Modifications, School of Marine Sciences and Biotechnology, Guangxi University for Nationalities</institution>, <addr-line>Nanning</addr-line>, <country>China</country></aff>
<aff id="aff3"><sup>3</sup><institution>School of Clinical Medicine, Southwest Medical University</institution>, <addr-line>Luzhou</addr-line>, <country>China</country></aff>
<aff id="aff4"><sup>4</sup><institution>Little Berry Research Room, Liaoning Institute of Fruit Science</institution>, <addr-line>Yingkou</addr-line>, <country>China</country></aff>
<aff id="aff5"><sup>5</sup><institution>Guangxi Key Laboratory of Rice Genetics and Breeding, Rice Research Institute, Guangxi Academy of Agricultural Sciences</institution>, <addr-line>Nanning</addr-line>, <country>China</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Andr&#x00E9;s J. Cort&#x00E9;s, Colombian Corporation for Agricultural Research (AGROSAVIA), Colombia</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Maria Fernanda Alvarez, Rice Program International Centre for Tropical Agriculture (CIAT), Colombia; Joong Hyoun Chin, Sejong University, South Korea</p></fn>
<corresp id="c001">&#x002A;Correspondence: Xiaoming Zheng, <email>zhengxiaoming@caas.cn</email></corresp>
<corresp id="c002">Qingwen Yang, <email>yangqingwen@caas.cn</email></corresp>
<fn fn-type="equal" id="fn002"><p><sup>&#x2020;</sup>These authors have contributed equally to this work</p></fn>
<fn fn-type="other" id="fn004"><p>This article was submitted to Plant Breeding, a section of the journal Frontiers in Plant Science</p></fn>
</author-notes>
<pub-date pub-type="epub">
<day>19</day>
<month>11</month>
<year>2021</year>
</pub-date>
<pub-date pub-type="collection">
<year>2021</year>
</pub-date>
<volume>12</volume>
<elocation-id>775051</elocation-id>
<history>
<date date-type="received">
<day>13</day>
<month>09</month>
<year>2021</year>
</date>
<date date-type="accepted">
<day>27</day>
<month>10</month>
<year>2021</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2021 Li, Han, Qiao, Wang, Song, Cui, Li, Ge, Lou, Fan, Li, Nong, Zhang, Cheng, Zhang, Zheng and Yang.</copyright-statement>
<copyright-year>2021</copyright-year>
<copyright-holder>Li, Han, Qiao, Wang, Song, Cui, Li, Ge, Lou, Fan, Li, Nong, Zhang, Cheng, Zhang, Zheng and Yang</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<p>Genes have been lost or weakened from cultivated rice during rice domestication and breeding. Weedy rice (<italic>Oryza sativa</italic> f. <italic>spontanea</italic>) is usually recognized as the progeny between cultivated rice and wild rice and is also known to harbor an gene pool for rice breeding. Therefore, identifying genes from weedy rice germplasms is an important way to break the bottleneck of rice breeding. To discover genes from weedy rice germplasms, we constructed a genetic map based on w-hole-genome sequencing of a F<sub>2</sub> population derived from the cross between LM8 and a cultivated rice variety. We further identified 31 QTLs associated with 12 important agronomic traits and revealed that <italic>ORUFILM03g000095</italic> gene may play an important role in grain length regulation and participate in grain formation. To clarify the genomic characteristics from weedy rice germplasms of LM8, we generated a high-quality genome assembly using single-molecule sequencing, Bionano optical mapping, and Hi-C technologies. The genome harbored a total size of 375.8 Mb, a scaffold N50 of 24.1 Mb, and originated approximately 0.32 million years ago (Mya) and was more closely related to <italic>Oryza sativa</italic> ssp. <italic>japonica</italic>. and contained 672 unique genes. It is related to the formation of grain shape, heading date and tillering. This study generated a high-quality reference genome of weedy rice and high-density genetic map that would benefit the analysis of genome evolution for related species and suggested an effective way to identify genes related to important agronomic traits for further rice breeding.</p>
</abstract>
<kwd-group>
<kwd>weedy rice</kwd>
<kwd>genetic map</kwd>
<kwd>QTL mapping</kwd>
<kwd>reference genome</kwd>
<kwd>comparative genomics</kwd>
</kwd-group>
<contract-num rid="cn001">31670211</contract-num>
<contract-num rid="cn001">31970237</contract-num>
<contract-sponsor id="cn001">National Natural Science Foundation of China<named-content content-type="fundref-id">10.13039/501100001809</named-content></contract-sponsor>
<contract-sponsor id="cn002">National Key Research and Development Program of China<named-content content-type="fundref-id">10.13039/501100012166</named-content></contract-sponsor>
<counts>
<fig-count count="8"/>
<table-count count="1"/>
<equation-count count="0"/>
<ref-count count="111"/>
<page-count count="16"/>
<word-count count="10491"/>
</counts>
</article-meta>
</front>
<body>
<sec id="S1" sec-type="intro">
<title>Introduction</title>
<p>Cultivated rice is one of the most important staple crops worldwide. The breeding of rice varieties with improved yield, quality, resistance to diseases and pests, and tolerance to abiotic stresses is significant to meet the increasing food demand in China and the world (<xref ref-type="bibr" rid="B37">Khush, 2001</xref>; <xref ref-type="bibr" rid="B102">Yang and Hwa, 2008</xref>; <xref ref-type="bibr" rid="B98">Xu et al., 2021</xref>). However, many genes have been lost from cultivated rice due to the long-term domestication and artificial selection, which hinders the breeding of advanced rice varieties. To the contrary, wild rice growing in natural environments is resistant or tolerant to different biotic and abiotic stresses and therefore retains a natural gene pool containing a large number of genes that have been lost or weakened from cultivated rice (<xref ref-type="bibr" rid="B83">Sun et al., 2002</xref>). Weedy rice has many characteristic traits similar to those of wild rice, many studies indicated that weedy rice was originated from wild rice and serves as a transition type between wild rice and cultivated rice (<xref ref-type="bibr" rid="B3">Baker, 1974</xref>; <xref ref-type="bibr" rid="B96">Wet and Harlan, 1975</xref>; <xref ref-type="bibr" rid="B12">Cho et al., 1995</xref>). Previous studies showed that weedy rice harbors the AA genome and no reproductive isolation was observed between weedy rice and cultivated rice (<xref ref-type="bibr" rid="B60">Nadir et al., 2018</xref>; <xref ref-type="bibr" rid="B84">Sun et al., 2019</xref>). Generally, the genes of weedy rice can be transferred to cultivated rice through breeding techniques such as hybridization and backcrossing (<xref ref-type="bibr" rid="B52">Lu et al., 2000</xref>; <xref ref-type="bibr" rid="B82">Stein et al., 2018</xref>). Weedy rice has been usually used as the genetic materials for rice genetics and breeding or to identify genes related to stress tolerance, disease and pest resistance, high yield, and high grain quality for improving modern rice varieties (<xref ref-type="bibr" rid="B33">Ishikawa et al., 2005</xref>; <xref ref-type="bibr" rid="B73">Shivrain et al., 2010</xref>; <xref ref-type="bibr" rid="B14">Dai et al., 2013</xref>).</p>
<p>In the past decades, rice functional genomics research, which focuses on technology platform construction and molecular cloning and functional analysis of genes related to important agronomic traits, has resulted in numerous achievements in gene discovery (<xref ref-type="bibr" rid="B23">Han et al., 2007</xref>; <xref ref-type="bibr" rid="B98">Xu et al., 2021</xref>). Due to its small genome and relatively simple structure, <italic>Oryza sativa</italic> (9311 and Nipponbare) became the first sequenced rice species in 2002 (<xref ref-type="bibr" rid="B19">Goff et al., 2002</xref>; <xref ref-type="bibr" rid="B105">Yu et al., 2002</xref>). These rice reference genomes have enabled massive rice functional genomics research, accelerated rice genetic improvement, and laid a foundation for studying genomes of other crops such as <italic>Zea mays</italic> (<xref ref-type="bibr" rid="B70">Schnable et al., 2009</xref>) and <italic>Triticum aestivum</italic> (<xref ref-type="bibr" rid="B32">International Wheat Genome Sequencing Consortium [IWGSC], 2014</xref>). With the development of sequencing technology, the time required for sequencing has largely decreased while the sequencing quality has greatly improved, therefore resulting in more high-quality reference genomes of cultivated rice varieties such as MH63, ZH97, and R498 (<xref ref-type="bibr" rid="B108">Zhang et al., 2016</xref>, <xref ref-type="bibr" rid="B109">2018</xref>; <xref ref-type="bibr" rid="B16">Du et al., 2017</xref>). The focus of rice research has also been gradually turned to elucidate biological characteristics and evolution processes and to analyze gene functions and related biological issues at the genomic level, as well as to identify genes related to important agronomic traits such as high yield, high quality, and stress resistance (<xref ref-type="bibr" rid="B28">Huang et al., 2010</xref>, <xref ref-type="bibr" rid="B30">2011</xref>, <xref ref-type="bibr" rid="B29">2015</xref>; <xref ref-type="bibr" rid="B99">Xun et al., 2012</xref>; <xref ref-type="bibr" rid="B95">Wei et al., 2014</xref>; <xref ref-type="bibr" rid="B104">Yano et al., 2016</xref>).</p>
<p>At present, numerous genes related to important agronomic traits (e.g., grain size) have been located and cloned, such as GS3 (<xref ref-type="bibr" rid="B18">Fan et al., 2006</xref>; <xref ref-type="bibr" rid="B56">Mao et al., 2018</xref>), GL3.1 (<xref ref-type="bibr" rid="B66">Qi et al., 2012</xref>), DEP1 (<xref ref-type="bibr" rid="B27">Huang et al., 2009</xref>), GW2 (<xref ref-type="bibr" rid="B76">Song et al., 2007</xref>), <italic>qSW5</italic> (<xref ref-type="bibr" rid="B74">Shomura et al., 2008</xref>), <italic>GW8</italic> (<xref ref-type="bibr" rid="B91">Wang et al., 2012b</xref>), and <italic>GS5</italic> (<xref ref-type="bibr" rid="B47">Li et al., 2011</xref>). Although the genome assembly of weedy rice WR04-6 has been constructed (<xref ref-type="bibr" rid="B84">Sun et al., 2019</xref>), the progress of identifying genes from weedy rice and the functional genomics research remains hindered due to a lack of more high-quality reference genomes. Generally, the morphological characteristics of weedy rice is between wild rice (<italic>O. rufipogon</italic>) and cultivated rice (<italic>O. sativa</italic> L.) (<xref ref-type="bibr" rid="B85">Sun et al., 2013</xref>; <xref ref-type="bibr" rid="B13">Cui et al., 2016</xref>). Our previous taxonomic study showed that LM8 is a low heterozygous weedy rice germplasm. The plants are homozygous and can be inherited stably that is characterized by very small grains. To discover genes from weedy rice germplasms of LM8, we constructed a genetic map based on whole-genome sequencing of a F<sub>2</sub> population derived from the cross between LM8 and a cultivated rice variety. In combination with the phenotypic data of 12 important agronomic traits collected from the F<sub>2</sub> population, we also tried to identify some new genes from the weedy rice. Moreover, to clarify the genomic characteristics from weedy rice germplasms of LM8, we generated a high-quality genome assembly of LM8 based on the Nanopore sequencing technology and characterized the LM8 genome to reveal its evolutionary relationship, which broadens our understanding of weedy rice at the genomic level. Based on our study, we found that the combination of genetic map and genome map is critical to quickly discover candidate genes such as plant-type, panicle-type, and gain-size in weed rice.</p>
</sec>
<sec id="S2" sec-type="materials|methods">
<title>Materials and Methods</title>
<sec id="S2.SS1">
<title>Plant Materials</title>
<p>The weedy rice LM8 was obtained from the China National Genebank. It shows erect and compact architecture similar to cultivated rice and harbors typical characteristics, such as small grain size and black hull. The cultivated rice variety Shen 08S was provided by the Anhui Academy of Agricultural Sciences. A F<sub>2</sub> population (1229 samples) was obtained from a cross between LM8 and Shen 08S and was planted in the experimental fields under natural growth conditions in Nanning, Guangxi Autonomous Region, China. In this study, the F2 population were collected from one F1. Fresh and healthy leaves were collected at seedling stage and stored at 80&#x00B0;C for subsequent genomic DNA extraction.</p>
</sec>
<sec id="S2.SS2">
<title>Population Sequencing and Genetic Map Construction</title>
<p>Fresh leaves of randomly selected 199 samples of the F<sub>2</sub> population and their parents (LM8 and Shen 08S) were used to extract genomic DNA with the cetyltrimethylammonium bromide (CTAB) method. The Illumina PE150 libraries were constructed according to the manufacturer&#x2019;s instructions and sequenced on an Illumina HiSeq X Ten platform. The two parental genotypes were sequenced at a higher depth (20 &#x00D7; coverage) to obtain 10 Gb data each, and F<sub>2</sub> individuals were sequenced at a lower depth (&#x223C; 10 &#x00D7; coverage) to obtain 5 Gb data each. Low-quality reads were removed to obtain clean reads, which were then mapped to the LM8 genome (LM8_v1) using BWA (mem -t 4 -k 32 -M -R) (<xref ref-type="bibr" rid="B42">Li and Durbin, 2009</xref>). SAMtools (sort rmup) (<xref ref-type="bibr" rid="B43">Li et al., 2009</xref>) was used to convert and sort the mapping results and to remove PCR duplicate reads. The clean reads of each F<sub>2</sub> individual that passed the quality control were mapped to the reference genome (LM8_v1) for haplotype-based SNP calling. Development of polymorphic markers was performed by GATK (<xref ref-type="bibr" rid="B58">McKenna et al., 2010</xref>) for SNP identification and genotyping, and a total of 2,373,849 SNP markers were obtained. Then, these SNP markers were filtered by removing abnormal bases, abnormal genotypes, incomplete coverage markers, and segregation distortion markers, and were sorted into LGs (<xref ref-type="bibr" rid="B100">Yang et al., 2018</xref>). After filtering, 10,739 SNP markers were cluster into 12 LGs using JoinMap v4.1 (Mapping algorithm&#x2014;ML Mapping, Regression mapping&#x2014;Kosambi&#x2019;s) (<xref ref-type="bibr" rid="B78">Stam, 1993</xref>).</p>
</sec>
<sec id="S2.SS3">
<title>Phenotypic Evaluation of the F<sub>2</sub> Population</title>
<p>We collected the main culm of plant individuals at 25 days after heading to measure the plant height (PH), tillering number (TN), flag leaf length (FLL), and flag leaf width (FLW) using a ruler. At maturity, the main panicles of plant individuals were harvested to measure panicle length (PL) using a ruler, and the primary branch number (PB) and secondary branch number (SB) (<xref ref-type="bibr" rid="B55">Ma et al., 2016</xref>) were recorded. The filled grains were used to calculate the grain length (GL), grain width (GW), grain thickness (GT), length width ratio (LWR), and thousand-grain weight (TGW) using an automatic seed analyzer with three replicates (Wanshen Detection Technology, Hangzhou, China). The analysis of variance (ANOVA) and correlations of phenotypic characteristics collected from the F<sub>2</sub> population were conducted in R v3.6.2 (<xref ref-type="bibr" rid="B40">Langfelder and Horvath, 2012</xref>).</p>
</sec>
<sec id="S2.SS4">
<title>QTL Mapping and Candidate Gene Prediction</title>
<p>QTL mapping was conducted using a permutation test (<italic>n</italic> = 1,000) in MapQTL6.0 with the composite interval mapping method to determine the limit of detection (LOD) value of each phenotype (<xref ref-type="bibr" rid="B63">Ooijen et al., 2009</xref>). Then the CIM mapping method in Win QTL Cartographer v2.5 software was used to locate the QTL position, contribution rate, and additive effect (<xref ref-type="bibr" rid="B92">Wang et al., 2012a</xref>). The 99% confidence interval of a QTL were determined as a candidate region, in which genes harbored non-synonymous coding mutations, premature or extended termination mutations were regarded as functional genes.</p>
</sec>
<sec id="S2.SS5">
<title>Genome Library Construction and Sequencing</title>
<p>Genomic DNA was extracted from the fresh leaves of LM8 using Genomic kit (13343, Qiagen, Germany). Total RNA was extracted from five different tissues (root, leaf, stem, flower, and spike) by using the TRNzol Universal Total RNA extraction Kit (DP424, Tiangen, China). The total RNA was reserve transcribed into cDNA using SMARTer PCR cDNA Synthesis Kit (634926, Takara, China). PCR was performed using PrimeSTAR GXL DNApolymerase (R050A, Takara, China). The purity, concentration, and integrity of DNA and RNA were determined using NanoDrop&#x2122; One UV-Vis spectrophotometer (Thermo Fisher Scientific, United States), Qubit<sup>&#x00AE;</sup> 3.0 Fluorometer (Invitrogen, United States) and Agilent 2100 Bioanalyzer (Agilent technologies, United States).</p>
<p>A library for Illumina paired-end sequencing with an insert size of 350&#x2013;500 bp was constructed and sequenced on an Illumina HiSeq X ten platform (Illumina, San Diego, CA, United States). Oxford Nanopore library preparation was conducted according to the manufacturer&#x2019;s instruction (13343, Qiagen, Germany) and sequenced on a PromethION platform (Oxford Nanopore Technologies, Oxford, United Kingdom). Fresh young leaves were vacuum-infiltrated with formaldehyde solution and used for cross-link action. The Hi-C library was prepared following the manufacturer&#x2019;s protocol and sequenced on an Illumina HiSeq X ten platform. SMRTbell library of RNA-seq was constructed from a pooled cDNA sample of five different tissue (root, leaf, stem, flower, and spike) using SMRTbell template prep kit 2.0 (100222300, Pacific Biosciences, United States) and sequenced on a PacBio Sequel sequencer (Pacific Biosciences, Menlo Park, United States) to obtain full-length transcriptome data.</p>
</sec>
<sec id="S2.SS6">
<title>Genome Assembly</title>
<p>The Illumina short reads were filtered using fastp v0.20.0 with default parameters (<xref ref-type="bibr" rid="B11">Chen et al., 2018</xref>). The abundance of 17 nt K-mers (-C -m 17 -s 400M) was used to estimate the genome size and heterozygous rate (<xref ref-type="bibr" rid="B57">Mar&#x00E7;ais and Kingsford, 2011</xref>; <xref ref-type="bibr" rid="B48">Liu et al., 2013</xref>; <xref ref-type="bibr" rid="B38">Koren et al., 2017</xref>). Correction of long reads generated from the Oxford Nanopore PromethION platform and <italic>de novo</italic> assembly were performed by <italic>NextDenovo</italic> v1.1.1 (read_cuoff = 2 k, seed_cutoff = 23 k, blocksize = 1 g, pa_raw_align = 20, pa_correction = 35) and <italic>SMARTdenovo</italic> (-e dom -J 5000 -k 17) (<xref ref-type="bibr" rid="B49">Loman et al., 2015</xref>; <xref ref-type="bibr" rid="B8">Cali et al., 2018</xref>). The Illumina short reads were mapped to the initial sequence assembly using BWA v0.7.12-r1039 with default parameters, which was then iteratively polished with three rounds of correction using NextPolish v3.0.1 (-max_depth 100 cluster_optons = -w n -l vf = {vf} -q all.q -pe smp {cpu} genome_size = auto) (<xref ref-type="bibr" rid="B88">Walker et al., 2014</xref>; <xref ref-type="bibr" rid="B24">Hu et al., 2020</xref>). Purge Haplotigs software was used to generate a contig-level assembly with only one copy of each of the contigs from heterozygous regions. The completeness of the draft genome was assessed by BUSCO v3 with the embryophyta_odb9 database (<xref ref-type="bibr" rid="B75">Sim&#x00E3;o et al., 2015</xref>).</p>
<p>Ultra-high-molecular-weight (uHMW) DNA (DNA length &#x003E; 250 kb) were extracted using Bionano Prep Plant DNA Isolation Kit (80003; Bionano Genomics, United States) according to the manufacturer&#x2019;s instructions. uHMW DNA molecules were labeled with the DLE-1 enzyme and loaded onto a Saphyr Chip and scanned for images on a Bionano Saphyr system (Bionano Genomics, San Diego, CA, United States). The raw molecules generated were quality-controlled and filtered (molecules with a size &#x003C; 150 kb were removed). An optical map was generated using Bionano Solve package v3.4. The generated optical map was used to construct scaffolds using the Hybrid Scaffold pipeline of Bionano Solve package v3.4 (CL.py -d -U -N 6 -y -i 3 -F 1 -a opt Arguments_non-haplotype_noES_noCut_saphyr.xml) and Bionano Access v1.5.2 (Bionano Genomics, San Diego, CA, United States) with a more stringent (1e-13) merging <italic>p</italic>-value threshold (<xref ref-type="bibr" rid="B97">Xiao et al., 2007</xref>; <xref ref-type="bibr" rid="B69">Reisner et al., 2010</xref>; <xref ref-type="bibr" rid="B59">Mostovoy et al., 2016</xref>). The Hi-C raw reads were filtered by fastp v0.12.6 with default parameters and then mapped to the scaffolds with Bowtie2 (<xref ref-type="bibr" rid="B41">Langmead and Salzberg, 2012</xref>; <xref ref-type="bibr" rid="B11">Chen et al., 2018</xref>). We used Lachesis (ligating adjacent chromatin enables scaffolding <italic>in situ</italic>) to cluster, order, and anchor scaffolds onto the chromosomes (<xref ref-type="bibr" rid="B7">Burton et al., 2013</xref>; <xref ref-type="bibr" rid="B17">Dudchenko et al., 2017</xref>).</p>
</sec>
<sec id="S2.SS7">
<title>Annotation of Genome</title>
<p>The repeat sequences and elements were annotated by a combination of <italic>de novo</italic> and homology-based methods. LTR_FINDER (<xref ref-type="bibr" rid="B22">Haas et al., 2008</xref>) and RepeatModeler (<xref ref-type="bibr" rid="B21">Haas et al., 2003</xref>) were used to generate a dataset of repetitive sequences with default parameters. This dataset was BLAST against the Plant Genome and Systems Biology (PGSB) repeat element database to classify the repeats (<xref ref-type="bibr" rid="B77">Spannagl et al., 2016</xref>), and then RepeatMasker was employed to annotate these repeats based on the Repbase database (<xref ref-type="bibr" rid="B4">Bao et al., 2015</xref>). Further, tandem repeats finder software was used to identify tandem repeats (<xref ref-type="bibr" rid="B6">Benson, 1999</xref>).</p>
<p>The protein-coding genes of the LM8 genome were predicted through a comprehensive strategy that combined results obtained from <italic>de novo</italic>, homology-based, and transcriptome-based predictions. Augustus was used for <italic>de novo</italic> prediction with Hidden Markov Model (<xref ref-type="bibr" rid="B80">Stanke et al., 2008</xref>). Homologous proteins from six plant genomes (<italic>Arabidopsis thaliana</italic>, <italic>O. sativa</italic>, <italic>Zea mays</italic>, <italic>Hordeum vulgare</italic>, <italic>Physcomitrella patens</italic>, and <italic>Triticum aestivum</italic>) were downloaded from Ensembl plants<sup><xref ref-type="fn" rid="footnote1">1</xref></sup> and used for homology-based prediction by GeMoMa (<xref ref-type="bibr" rid="B35">Jens et al., 2016</xref>). The non-redundant full-length transcripts obtained from the PacBio Sequel platform were aligned to the LM8 genome assembly for transcriptome-based prediction using PASA (<xref ref-type="bibr" rid="B21">Haas et al., 2003</xref>).</p>
<p>Gene structures were determined based on a combination of results from the three prediction methods using EvidenceModeler (<xref ref-type="bibr" rid="B22">Haas et al., 2008</xref>). Functional annotation of protein-coding genes was achieved by BLASTP searches against the Swiss-Prot database (<xref ref-type="bibr" rid="B81">Stanke and Waack, 2003</xref>). Protein domains were annotated by searching against the InterPro database using InterProScan (<xref ref-type="bibr" rid="B106">Zdobnov and Apweiler, 2001</xref>; <xref ref-type="bibr" rid="B31">Hunter et al., 2009</xref>). Non-coding RNA genes, including miRNA, snRNA, and rRNA genes were predicted according to the Rfam database, while tRNA genes were identified using tRNAscan-SE (<xref ref-type="bibr" rid="B51">Lowe and Eddy, 1997</xref>; <xref ref-type="bibr" rid="B20">Griffiths-Jones et al., 2005</xref>). The completeness of the predicted gene set was assessed by BUSCO v3 with the embryophyta_odb9 database (<xref ref-type="bibr" rid="B6">Benson, 1999</xref>).</p>
</sec>
<sec id="S2.SS8">
<title>Collinearity Analysis</title>
<p>Protein sequences of LM8, <italic>japonica</italic> var. Nipponbare, and <italic>indica</italic> var. R498 were aligned by BLASTP v2.6.0 with default settings. Syntenic gene blocks within the genome were detected by MCScanX (<xref ref-type="bibr" rid="B93">Wang et al., 2012c</xref>) and visualized using the jcvi python module.</p>
</sec>
<sec id="S2.SS9">
<title>Identification of Gene Families</title>
<p>Gene family identification was performed across LM8 (<italic>O. sativa</italic> f. <italic>spontanea</italic>), <italic>O. aus</italic> (AUS), 5 cultivated rice varieties, and 11 wild rice species. The 5 cultivated rice varieties included <italic>O. sativa</italic> ssp. <italic>indica</italic> (IND), <italic>O. sativa</italic> ssp. <italic>japonica</italic> (JAP), <italic>O. sativa</italic> ssp. <italic>indica</italic> var. Minghui63 (MH63), <italic>O. sativa</italic> ssp. <italic>indica</italic> var. Zhenshan97 (ZS97), <italic>O. sativa</italic> ssp. <italic>indica</italic> var. Shuhui498 (R498). The 11 wild rice species consisted of <italic>O. glaberrima</italic> (GLA), <italic>O. barthii</italic> (BAR), <italic>O. glumaepatula</italic> (GLU), <italic>O. meridionalis</italic> (MER), <italic>O. rufipogon</italic> (RUF), <italic>O. nivara</italic> (NIV), <italic>O. longistaminata</italic> (LON), <italic>O. punctata</italic> (PUN), <italic>O. brachyantha</italic> (BRA), <italic>O. rufipogon</italic> var. JX-6 (JX-6), and <italic>O. rufipogon</italic> var. Z59 (Z59). PUN and BRA belong to the BB and FF genomes, respectively, while the others belong to the AA genome. Across all species, the longest transcript of each gene was used in further analyses. Orthologous and paralogous gene clusters were identified using BLASTP (-e 1e-5 -F F). Clustering analysis of protein sequences from the 18 <italic>Oryza</italic> genomes was conducted with OrthoMCL (<xref ref-type="bibr" rid="B44">Li et al., 2003</xref>).</p>
</sec>
<sec id="S2.SS10">
<title>Phylogenetic Analysis</title>
<p>Multiple sequence alignments of the protein-coding sequences of the 4,241 single-copy orthologous genes obtained from the above analysis these protein sequences were performed by MAFFT (<xref ref-type="bibr" rid="B36">Katoh and Standley, 2013</xref>). Phylogenetic relationships were resolved using RAxML (-m GTRGAMMA -p 12345 -T 8 -f b -t -z) among these 18 <italic>Oryza</italic> genomes with all single-copy genes concatenated into an ultra-long aligned sequence, where <italic>O. brachyantha</italic> was designated as an outgroup (<xref ref-type="bibr" rid="B79">Stamatakis, 2014</xref>). Divergence times were estimated by MCMCtree (<xref ref-type="bibr" rid="B65">Puttick, 2019</xref>) with parameters of &#x201C;RootAge &#x2264; 0.21, rgene gamma = 23.52254, burnin = 100,000, sampfreq = 100, nsample = 50,000, model = 7&#x201D; in the PAML package (<xref ref-type="bibr" rid="B61">Nikolau et al., 2003</xref>) based on a known divergence time (&#x223C; 0.4 Mya) between <italic>O. nivara</italic> and <italic>O. rufipogon</italic>.</p>
</sec>
<sec id="S2.SS11">
<title>Expansion and Contraction of Gene Families</title>
<p>A random birth-and-death model was used to estimate changes in gene families between the ancestor and each species using CAFE with conditional likelihoods as the test statistics (-p 0.05 -t 10 -r 10000 lambda -s) (<xref ref-type="bibr" rid="B15">De Bie et al., 2006</xref>). A probabilistic graphical model (PGM) was used to calculate the probability of transitions in each gene family, and then all the gene families were classified into three types (expanded, contracted, and unchanged). Finally, GO enrichment was performed for further functional analysis of the expanded genes.</p>
</sec>
<sec id="S2.SS12">
<title>Positive Selection Analysis</title>
<p>All orthologous genes identified in the LM8 genome were tested for positive selection. The phylogenetic tree generated by RAxML was used as the input, and the branch-site test was conducted with CodeML (model = 2, NSsites = 2, fix_omega = 0, fix_omega = 1, omega = 1) in the PAML package (<xref ref-type="bibr" rid="B103">Yang, 2007</xref>). Genes under positive selection were determined based on the likelihood ratio test (<italic>P</italic> &#x003C; 0.01).</p>
</sec>
</sec>
<sec id="S3" sec-type="results">
<title>Results</title>
<sec id="S3.SS1">
<title>Genetic Map Construction and QTL Analysis With a F<sub>2</sub> Population</title>
<p>To further understand the mechanism of LM8 genome variation in its special grain formation, a F<sub>2</sub> population was generated from the cross between LM8 and a cultivated rice variety Shen 08S. The two parents, LM8 and Shen 08S, showed obvious differences in plant height, panicle length, and grain size (<xref ref-type="fig" rid="F1">Figure 1</xref> and <xref ref-type="supplementary-material" rid="DS2">Supplementary Table 1</xref>). We sequenced the genome of F<sub>2</sub> individuals as well as that of the two parents. A total of 10,739 high-quality SNPs were obtained and used to generate a genetic map. The total genetic distance of the constructed genetic map was 12,171.13 cM, and the average genetic distance between two SNPs was 1.13 cM (<xref ref-type="fig" rid="F1">Figure 1</xref>). The SNPs were distributed throughout the 12 linkage groups (LGs) with the highest SNP number (1,754) occurring on LG1 (1,510.48 cM total size) and the lowest (523) on LG12 (713.79 cM total size). Collinearity analysis showed that the genetic map had strong collinearity (99.69%) with the reference genome sequence (<xref ref-type="supplementary-material" rid="DS1">Supplementary Figure 1</xref>), and the sources of most segments in F<sub>2</sub> individuals were consistent according to the monomer source analysis. These results suggest that the constructed genetic map is of high-quality and suitable for further analyses.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption><p>Agronomic characteristics of LM8 and Shen 08S (parents) and the genetic map constructed based on the F<sub>2</sub> population. <bold>(A)</bold> Plant height of LM8 (right) and Shen 08S (left). Bar = 10 cm. <bold>(B)</bold> Panicle length of LM8 (right) and Shen 08S (left). Bar = 0.5 cm. <bold>(C)</bold> Branches of LM8 (right) and Shen 08S (left). Bar = 2 cm. <bold>(D)</bold> Grain size of LM8 (bottom) and Shen 08S (above). Bar = 1 cm. <bold>(E)</bold> Genomic locations of 12 agronomic trait associated QTLs are illustrated on the 12 linkage groups. PH, plant height; TN, tillering number; FLL, flag leaf length; FLW, flag leaf width; PL, panicle length; PB, primary branch number; SB, secondary branch number; GL, grain length; GW, grain width; GT, grain thickness; LWR, length to width ratio; TGW, thousand-grain weight.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-12-775051-g001.tif"/>
</fig>
<p>Besides, combining the phenotypic data (<xref ref-type="fig" rid="F2">Figure 2</xref>) obtained from the F<sub>2</sub> population and the genetic map, we identified 31 quantitative trait loci (QTLs) with 607 genes related to 4 plant-type traits, 3 panicle-type traits, and 5 grain-size traits (<xref ref-type="fig" rid="F1">Figure 1</xref>). Eight of the QTLs explaining more than 17% of the phenotypical variation were identified as major QTLs, which were located at 788.3&#x2013;789.4 cM on chromosome 3 (chr3), 34.4&#x2013;37.5 cM on chr11, 782.9&#x2013;786.6 cM on chr3, 787.6&#x2013;788.2 cM on chr3, 244.6&#x2013;253 cM on ch11, 204.9&#x2013;217.6 cM on chr2, 11.4&#x2013;17.3 cM on chr8, and 33.6&#x2013;38 cM on chr11 (<xref ref-type="supplementary-material" rid="DS2">Supplementary Table 2</xref> and <xref ref-type="supplementary-material" rid="DS1">Supplementary Figure 2</xref>). Fourteen QTLs were identified to be associated with grain-size traits, including 1 for grain length (GL), 3 for grain width (GW), 6 for grain thickness (GT), 1 for length width ratio (LWR), and 3 for thousand-grain weight (TGW). These results would help in further detecting the genes from the weedy rice LM8.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption><p>Frequency distribution of the 12 agronomic traits in the F<sub>2</sub> population. <bold>(A)</bold> GL, grain length. <bold>(B)</bold> GW, grain width. <bold>(C)</bold> GT, grain thickness. <bold>(D)</bold> LWR, length to width ratio. <bold>(E)</bold> TGW, thousand-grain weight. <bold>(F)</bold> PL, panicle length. <bold>(G)</bold> PH, plant height. <bold>(H)</bold> PB, primary branch number. <bold>(I)</bold> SB, secondary branch number. <bold>(J)</bold> TN, tillering number. <bold>(K)</bold> FLL, flag leaf length. <bold>(L)</bold> FLW, flag leaf width.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-12-775051-g002.tif"/>
</fig>
</sec>
<sec id="S3.SS2">
<title>Identification of Candidate Genes Related to Grain Length</title>
<p>LM8 has evolved to form extremely small grains that may develop new elite rice varieties to study grain shape or yield related traits. Therefore, using LM8 as the material to discover genes related to grain size is practical to enrich rice resources. We conducted a correlation analysis among the grain-size traits QTLs, including grain length, grain width, grain thickness, length to width ratio, and thousand-grain weight. Significant positive correlations (<italic>P</italic> &#x003C; 0.05) were observed among grain length, length to width ratio, and thousand-grain weight, indicating that grain length has significant impact on grain size (<xref ref-type="supplementary-material" rid="DS2">Supplementary Table 3</xref> and <xref ref-type="supplementary-material" rid="DS1">Supplementary Figure 3</xref>). One QTL related to grain length was located at 788.3&#x2013;789.4 cM on chr3, corresponding to a 60-kb interval harboring seven putative genes, which included 3 RAPdb annotated genes (<italic>ORUFILM03g000091</italic>, <italic>ORUFILM03g000095</italic>, <italic>ORUFILM03g000096</italic>) and 4 unknown function annotations (<italic>ORUFILM03g000090</italic>, <italic>ORUFILM03g000092</italic>, <italic>ORUFILM03g000093</italic>, <italic>ORUFILM03g000094</italic>) were important candidate genes controlling grain length (<xref ref-type="fig" rid="F3">Figure 3</xref> and <xref ref-type="supplementary-material" rid="DS2">Supplementary Table 4</xref>).</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption><p>QTL for grain length and prediction of candidate genes. <bold>(A)</bold> QTL mapping results for grain length and seven putative genes (<italic>ORUFILM03g000096</italic>, <italic>ORUFILM03g000095</italic>, <italic>ORUFILM03g000094</italic>, <italic>ORUFILM03g000093</italic>, <italic>ORUFILM03g000092</italic>, <italic>ORUFILM03g000091</italic>, and <italic>ORUFILM03g000090</italic>) within the region. <bold>(B)</bold> Gene structure of <italic>ORUFILM03g000095</italic> (top), <bold>(C)</bold> grain length (GL) distribution in each genotype of <italic>ORUFILM03g000095</italic>, <bold>(D)</bold> corresponding GL phenotypes in F<sub>2</sub> individuals (lower right). Asterisks is correlation between genotype and phenotype, &#x002A;<italic>P</italic> &#x003C; 0.05. &#x002A;&#x002A;<italic>P</italic> &#x003C; 0.01.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-12-775051-g003.tif"/>
</fig>
<p><italic>OsCLG1</italic> (<xref ref-type="bibr" rid="B101">Yang et al., 2021</xref>) mediate ubiquitin ligase to regulate grain length. Therefore, the candidate genes among seven candidate genes, <italic>ORUFILM03g000095</italic> is a homologous gene to <italic>Os03g0427900</italic> of <italic>Nipponbare</italic> and belongs to the U-box protein gene family, in which a U-box domain acts as a ubiquitin ligase to participate in protein degradation during the cell cycle and morphological development (<xref ref-type="bibr" rid="B71">Sharma and Taganna, 2020</xref>; <xref ref-type="bibr" rid="B101">Yang et al., 2021</xref>). To further investigate the molecular basis of the small grain phenotype in LM8, we analyzed the sequence of <italic>ORUFILM03g000095</italic> gene from LM8, Shen 08S, and their progenies and revealed a C-T SNP site, located in the 12th exon 5,339 bp downstream of the ATG start site (<xref ref-type="fig" rid="F3">Figure 3</xref>). Grain length in the F<sub>2</sub> individuals of LM8 and Shen 08S displayed a clear pattern with an order of TT &#x003E; CT &#x003E; CC (<italic>P</italic> &#x003C; <italic>0.01</italic>; <xref ref-type="fig" rid="F3">Figure 3</xref>). <italic>ORUFILM03g000095</italic> genotypes were significantly correlated to the grain length variation, suggesting that this locus plays an important role in grain size regulation. Our results suggest that <italic>ORUFILM03g000095</italic> are possible candidate genes controlling grain length. However, the underlying mechanisms of how this gene regulate grain formation remain elusive and need to be further explored.</p>
</sec>
<sec id="S3.SS3">
<title>Genome Assembly and Annotation</title>
<p>There are major differences between the morphology of weedy rice and cultivated rice (<italic>O. sativa</italic> L.). The current research on cultivated rice is relatively clear, but the research on weedy rice does not yet have a reference genome with high assembly quality. To clarify the genome characteristics of the F2 population parent (weed rice LM8), we assembled a high-quality genome. Before assembly, <italic>SOAPdenovo</italic> was used for pre-assembly. K-mer analysis (<italic>k</italic> = 17) estimated its genome size to be around 362.7 Mb, with a moderate heterozygous rate of 0.20% (<xref ref-type="supplementary-material" rid="DS1">Supplementary Figure 4</xref>). However, the completeness and quality of the assembly are not ideal if the genome is assembled using the second-generation sequencing data alone. Thus, the LM8 genome was sequenced and assembled by applying a combination of diverse technologies, including Oxford Nanopore long-read sequencing, Illumina short-read sequencing, Bionano optical mapping, and Hi-C technology (<xref ref-type="supplementary-material" rid="DS2">Supplementary Table 5</xref> and <xref ref-type="supplementary-material" rid="DS1">Supplementary Figure 5</xref>). A total of 77.2 Gb raw data (sequencing depth 100x) were collected from Oxford Nanopore long-read sequencing, which were then self-corrected, filtered, and polished to generate the final dataset (57.3 Gb) for genome assembly (<xref ref-type="table" rid="T1">Table 1</xref> and <xref ref-type="supplementary-material" rid="DS1">Supplementary Figure 6</xref>). The contig-level assembly (LM8_contig) comprised 375.3 Mb, with a contig N50 of 17.9 Mb (<xref ref-type="table" rid="T1">Table 1</xref> and <xref ref-type="supplementary-material" rid="DS2">Supplementary Table 6</xref>). Approximately 98.1% ubiquitous genes in embryophyte were detected by the Benchmarking Universal Single-Copy Orthologs (BUSCO) analysis (<xref ref-type="supplementary-material" rid="DS2">Supplementary Table 7</xref>), indicating that the assembled contig was of high-completeness.</p>
<table-wrap position="float" id="T1">
<label>TABLE 1</label>
<caption><p>Summary of the sequencing, assembly, and annotation of the LM8 genome.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left">Stat type</td>
<td valign="top" align="center">Number</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Assembled genome size (Gb)</td>
<td valign="top" align="center">77.2</td>
</tr>
<tr>
<td valign="top" align="left">Contig N50 (Mb)</td>
<td valign="top" align="center">17.9</td>
</tr>
<tr>
<td valign="top" align="left">Scaffold N50 (Mb)</td>
<td valign="top" align="center">30.5</td>
</tr>
<tr>
<td valign="top" align="left">Longest scaffold (Mb)</td>
<td valign="top" align="center">31.3</td>
</tr>
<tr>
<td valign="top" align="left">Anchored to chromosome (Mb)</td>
<td valign="top" align="center">375.8</td>
</tr>
<tr>
<td valign="top" align="left">Number of predicted protein-coding genes</td>
<td valign="top" align="center">36,561</td>
</tr>
<tr>
<td valign="top" align="left">Average gene length (bp)</td>
<td valign="top" align="center">3545.1</td>
</tr>
<tr>
<td valign="top" align="left">Average CDS length (bp)</td>
<td valign="top" align="center">1129.6</td>
</tr>
<tr>
<td valign="top" align="left">Average exons number per gene</td>
<td valign="top" align="center">4.4</td>
</tr>
<tr>
<td valign="top" align="left">Average exon length (bp)</td>
<td valign="top" align="center">255</td>
</tr>
<tr>
<td valign="top" align="left">Average intron length (bp)</td>
<td valign="top" align="center">705</td>
</tr>
<tr>
<td valign="top" align="left">Number of rRNAs</td>
<td valign="top" align="center">81</td>
</tr>
<tr>
<td valign="top" align="left">Number of snRNAs</td>
<td valign="top" align="center">772</td>
</tr>
<tr>
<td valign="top" align="left">Number of miRNAs</td>
<td valign="top" align="center">2,551</td>
</tr>
</tbody>
</table></table-wrap>
<p>Next, using 476.2 Gb of molecules (&#x003E; 150 kb) collected from Bionano Saphyr system, we generated an optical map for the LM8 genome, with a total size of 370.3 Mb and an N50 of 24.2 Mb. With the aid of this optical map, we further assembled LM8_contig into scaffolds (LM8_scaffold), with a total size of 375.8 Mb and a scaffold N50 of 24.1 Mb (<xref ref-type="supplementary-material" rid="DS2">Supplementary Table 6</xref>). After applying high-throughput chromosome conformation capture (Hi-C) data to orient, order, and phase these scaffolds, a total of 375.3 Mb sequences (99.85%; <xref ref-type="supplementary-material" rid="DS2">Supplementary Table 8</xref>) were anchored onto the 12 chromosomes and the final chromosome-level genome assembly (LM8_v1) was obtained. The Hi-C heatmap separated different chromosomes and showed that the interaction intensity in the diagonal-position was higher than that in the off-diagonal-position (<xref ref-type="supplementary-material" rid="DS1">Supplementary Figure 7</xref>). BUSCO analysis showed that 97.9% of the core embryophyte genes were complete in the LM8 genome assembly (<xref ref-type="supplementary-material" rid="DS2">Supplementary Table 7</xref>). In addition, 87.1% (31,810) of the predicted genes were expressed according to the transcriptome data. The above results suggest that the LM8 genome assembly is of high-quality and -completeness.</p>
<p>Repeat annotation results showed that 47.72% of the LM8 genome is composed of repetitive sequences, including 26.87% retrotransposons and 20.85% DNA transposons. About 94.08% of retrotransposons are long terminal repeats (LTRs), accounting for 25.28% of the genome. The two most frequent types of LTRs are <italic>Copia</italic> and <italic>Gypsy</italic>, accounting for 2.99 and 19.62%, respectively (<xref ref-type="fig" rid="F4">Figure 4</xref> and <xref ref-type="supplementary-material" rid="DS2">Supplementary Table 9</xref>). Besides, through a comprehensive strategy combining results obtained from <italic>de novo</italic>, homology-based, and transcriptome-based prediction, 36,561 protein-coding genes were annotated in the LM8 genome. These protein-coding genes have an average length of 3,545.1 bp, an average coding sequence length of 1,129.6 bp, an average exon length of 255.2 bp, an average intron length of 705.1 bp, and an average exon number per gene of 4.4 (<xref ref-type="table" rid="T1">Table 1</xref>). Among these annotated genes, 34,773 (95.91%) were functionally annotated by at least one of the Swiss-Prot, KEGG, and InterPro databases (<xref ref-type="supplementary-material" rid="DS2">Supplementary Table 10</xref>). In addition, homology-based annotation of non-coding RNAs (ncRNAs) predicted 2,551 microRNAs (miRNAs), 81 ribosomal RNAs (rRNAs), and 772 small nuclear RNAs (snRNAs; <xref ref-type="supplementary-material" rid="DS2">Supplementary Table 11</xref>).</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption><p>The morphology and genome features of LM8. <bold>(A)</bold> Whole plants, bar = 10 cm. <bold>(B)</bold> Panicles, bar = 2 cm. <bold>(C)</bold> Grains, bar = 1 cm. <bold>(D)</bold> Genome features of LM8. Circles from inside to outside are transposable element (TE) content, repeat density, gene density, and GC density.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-12-775051-g004.tif"/>
</fig>
</sec>
<sec id="S3.SS4">
<title>Comparative Analysis</title>
<p>To reveal the evolutionary relationship of the weedy rice LM8, 4,241 single-copy orthologous genes of LM8 and those from other 17 <italic>Oryza</italic> genomes were used to construct a phylogenetic tree by the maximum-likelihood (ML) method (<xref ref-type="fig" rid="F5">Figure 5</xref> and <xref ref-type="supplementary-material" rid="DS2">Supplementary Table 12</xref> and <xref ref-type="supplementary-material" rid="DS1">Supplementary Figure 8</xref>). The phylogenetic tree demonstrated that LM8 diverged from the ancestor <italic>O. rufipogon</italic> &#x223C; 0.32 million years ago (Mya; <xref ref-type="fig" rid="F5">Figure 5</xref>) and was clustered into a group with <italic>japonica</italic>, indicating LM8 is more closely related to <italic>japonica</italic> compared to <italic>indica</italic>. Additionally, genome collinearity analyses conducted between LM8 and two cultivated rice varieties revealed that the LM8 genome had more collinear genes with <italic>japonica</italic> var. Nipponbare (47,439/78,939; 60.1%) than <italic>indica</italic> var. R498 (34,750/74,110; 46.89%; <xref ref-type="fig" rid="F6">Figure 6</xref> and <xref ref-type="supplementary-material" rid="DS1">Supplementary Figure 9</xref>). Collectively, we speculate that LM8 belongs to <italic>japonica</italic>-type weedy rice.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption><p>Comparative genomics analyses of LM8 with other <italic>Oryza</italic> genomes. <bold>(A)</bold> Statistics of gene families in 18 <italic>Oryza</italic> genomes. <bold>(B)</bold> Core and dispensable genes from five reference genomes. The numbers in the species section and overlapping section indicate the numbers of specific and shared gene families, respectively. IND, <italic>O. sativa</italic> ssp. <italic>indica</italic>. JAP, <italic>O. sativa</italic> ssp. <italic>japonica</italic>. RUF, <italic>O. rufipogon</italic>. NIV, <italic>O. nivara</italic>. and LM8, <italic>O. sativa</italic> f. <italic>spontanea</italic>. <bold>(C)</bold> Phylogenetic relationships and grain phenotypes of LM8 and other <italic>Oryza</italic> genomes. Pie charts represent total gene families, consisting of contracted gene families (red), expanded gene families (green), and unchanged gene families (blue). The numbers of genes in expanded (+) and contracted (&#x2013;) gene families in each rice variety are shown with the rice variety name farthest to the right. The lineage divergence times are indicated on the nodes and nodes marked in red are known fossil time points. <italic>O. brachyantha</italic> was used as the outgroup. MRCA, most recent common ancestor. AUS, <italic>O. aus</italic>. IND, <italic>O. sativa</italic> ssp. <italic>indica</italic>. JAP, <italic>O. sativa</italic> ssp. <italic>japonica</italic>. GLA, <italic>O. glaberrima</italic>. BAR, <italic>O. barthii</italic>. GLU, <italic>O. glumaepatula</italic>. MER, <italic>O. meridionalis</italic>. RUF, <italic>O. rufipogon</italic>. NIV, <italic>O. nivara</italic>. LON, <italic>O. longistaminata</italic>. PUN, <italic>O. punctata</italic>. BRA, <italic>O. brachyantha</italic>. JX-6, <italic>O. rufipogon</italic> var. JX-6. Z59, <italic>O. rufipogon</italic> var. Z59. MH63, <italic>O. sativa</italic> ssp. <italic>indica</italic> var. Minghui63. ZS97, <italic>O. sativa</italic> ssp. <italic>indica</italic> var. Zhenshan97. R498, <italic>O. sativa</italic> ssp. <italic>indica</italic> var. Shuihui498. and LM8, <italic>O. sativa</italic> f. <italic>spontanea</italic>.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-12-775051-g005.tif"/>
</fig>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption><p>Collinearity between LM8 and two cultivated rice (JAP and R498) genomes. <bold>(A)</bold> Collinearity between JAP and LM8. <bold>(B)</bold> Collinearity between R498 and LM8.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-12-775051-g006.tif"/>
</fig>
<p>By comparing LM8 with four other rice species including <italic>O. nivara</italic> (NIV), <italic>O. sativa</italic> ssp. <italic>indica</italic> (IND), <italic>O. sativa</italic> ssp. <italic>japonica</italic> (JAP), and <italic>O. rufipogon</italic> (RUF), we found that 68.4% (17,403/25,430) of the gene families in LM8 were shared among all five species, while approximately 12.4% (3,143/25,430) were specific to LM8 (<xref ref-type="fig" rid="F5">Figure 5</xref>). The closer the relationship indicated by the phylogenetic tree, the more the shared gene families (<xref ref-type="fig" rid="F7">Figure 7</xref>). Among the 18 <italic>Oryza</italic> genomes, 2,875 unclustered genes and 672 unique genes were observed in the LM8 genome (<xref ref-type="supplementary-material" rid="DS2">Supplementary Table 12</xref> and <xref ref-type="supplementary-material" rid="DS1">Supplementary Figure 8</xref>). The proteins encoded by these unique genes related to the formation of grain length, heading date and tillering number including serine/threonine-protein phosphatases (<italic>ORUFILM03g000947</italic>), photosystem II reaction center proteins (<italic>ORUFILM08g001423</italic>), and zinc finger MYM-type proteins (<italic>ORUFILM03g000136</italic>).</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption><p>Venn diagrams showing specific and shared gene families between LM8 and other <italic>Oryza</italic> genomes in the same cluster of the evolution tree. <bold>(A)</bold> JAP, RUF, JX6, Z59 and LM8. <bold>(B)</bold> LON, MER, PUN, BRA and LM8. <bold>(C)</bold> MH63, R498, ZS97 and LM8. <bold>(D)</bold> AUS, NIV, IND and LM8. <bold>(E)</bold> BAR, GLU, GLA, and LM8. AUS, <italic>O. aus</italic>. IND, <italic>O. sativa</italic> ssp. <italic>indica</italic>. JAP, <italic>O. sativa</italic> ssp. <italic>japonica</italic>. GLA, <italic>O. glaberrima</italic>. BAR, <italic>O. barthii</italic>. GLU, <italic>O. glumaepatula</italic>. MER, <italic>O. meridionalis</italic>. RUF, <italic>O. rufipogon</italic>. NIV, <italic>O. nivara</italic>. LON, <italic>O. longistaminata</italic>. PUN, <italic>O. punctata</italic>. BRA, <italic>O. brachyantha</italic>. JX-6, <italic>O. rufipogon</italic> var. JX-6. Z59, <italic>O. rufipogon</italic> var. Z59. MH63, <italic>O. sativa</italic> ssp. <italic>indica</italic> var. Minghui63. ZS97, <italic>O. sativa</italic> ssp. <italic>indica</italic> var. Zhenshan97. R498, <italic>O. sativa</italic> ssp. <italic>indica</italic> var. Shuihui498. and LM8, <italic>O. sativa</italic> f. <italic>spontanea</italic>.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-12-775051-g007.tif"/>
</fig>
</sec>
<sec id="S3.SS5">
<title>Gene Family Analysis</title>
<p>Gene family expansion/contraction has been shown to be associated with domestication and ecological adaptation (<xref ref-type="bibr" rid="B64">Peng et al., 2019</xref>; <xref ref-type="bibr" rid="B107">Zeng et al., 2019</xref>). To characterize the LM8 genome, a genome-wide comparative genomics analysis was performed among 18 <italic>Oryza</italic> genomes (<xref ref-type="supplementary-material" rid="DS2">Supplementary Table 13</xref>). We assigned 36,561 LM8 genes to 25,430 gene families (<xref ref-type="table" rid="T1">Table 1</xref> and <xref ref-type="supplementary-material" rid="DS2">Supplementary Table 14</xref>). Relative to the common ancestor of rice (<italic>O. rufipogon</italic>), 16.06% (4,086/25,430) expansion and 28.73% (7307/25,430) contracted gene families were observed (<xref ref-type="fig" rid="F5">Figure 5</xref> and <xref ref-type="supplementary-material" rid="DS2">Supplementary Table 14</xref>). The expansion gene families included 12793 expansion genes, of which 213 QTL mapping genes belonged to the expanded gene family. In the expanded gene families, Gene Ontology (GO) enrichment analysis revealed 295 GO terms involving biological process (BP), cellular component (CC), and molecular function (MP). Sixty-seven pathways were significantly enriched, including carbohydrate metabolic process, signal transduction, and cell growth (<xref ref-type="fig" rid="F8">Figure 8</xref>). The significantly enriched genes may contribute to the adaptability of LM8 to complex environments during evolution. Meanwhile, we found 57 genes among the QTL mapping were detected by GO enrichment and enriched into 20 pathways including catalytic activity, proteolysis, and transmembrane transport protein activity (<xref ref-type="supplementary-material" rid="DS2">Supplementary Table 15</xref>). A total of 168 positive selection genes (PSGs) were identified and annotated to be auxin response proteins (e.g., <italic>ORUFILM02g003288</italic>), cell division control proteins (e.g., <italic>ORUFILM01g004046</italic>), and ubiquitin-protein ligase E3 UPL4 (e.g., <italic>ORUFILM05g002772</italic>), which may participate in the regulation of grain growth process and grain formation (<xref ref-type="bibr" rid="B53">Luo et al., 2013</xref>; <xref ref-type="bibr" rid="B5">Basunia et al., 2021</xref>). Nevertheless, whether these PSGs can explain the difference in the grain size need to be further explored.</p>
<fig id="F8" position="float">
<label>FIGURE 8</label>
<caption><p>Statistics of the GO enrichment analysis of the expanded gene families. The <italic>x</italic>-axis represents the percentage of enriched genes to the total annotated genes. The <italic>y</italic>-axis indicates the entry of each enrichment category. The size of the dots corresponds to the number of enriched genes, and the color panel on the right indicates the <italic>q</italic>-value. The lower the value, the more significant it is.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-12-775051-g008.tif"/>
</fig>
</sec>
</sec>
<sec id="S4" sec-type="discussion">
<title>Discussion</title>
<p>With the development of sequencing techniques and corresponding analysis approaches, the sequencing speed and quality have greatly improved, while the cost has decreased tremendously, allowing a growing number of genomes to be sequenced and applied to related studies. The combination of a specific chromosome-level genome assembly and a high-density genetic map has been verified to be effective to map QTLs or locate genes associated with important agronomic traits (<xref ref-type="bibr" rid="B54">Luo et al., 2020</xref>) and has been widely applied to various important crops including cotton (<xref ref-type="bibr" rid="B90">Wang F. et al., 2020</xref>), peanut (<xref ref-type="bibr" rid="B1">Agarwal et al., 2018</xref>), <italic>Cucumis melo</italic> (<xref ref-type="bibr" rid="B25">Hu et al., 2018</xref>), pear (<xref ref-type="bibr" rid="B45">Li et al., 2019</xref>). In rice, <xref ref-type="bibr" rid="B46">Li et al. (2018)</xref> constructed a high-density genetic map through performing whole-genome resequencing and identified a candidate gene (<italic>DEP1</italic>) in determining panicle length. Later, <xref ref-type="bibr" rid="B84">Sun et al. (2019)</xref> constructed a genetic map and located a region on chr1 contributing to seed shattering, awn length, and plant height. In this study, we generated a chromosome-level genome assembly and constructed a high-density genetic map with the help of high-throughput sequencing approaches, we identified <italic>ORUFILM03g000095</italic> gene on chr3 that may regulate grain length (<xref ref-type="fig" rid="F3">Figure 3</xref>). We have analyzed the candidate gene based on 3K genome data which is important research in rice genomics research (<xref ref-type="bibr" rid="B94">Wang et al., 2018</xref>; <xref ref-type="bibr" rid="B89">Wang C. et al., 2020</xref>), but the same haplotype as LM8 was not found in 3K data, so we did not further analyze it (<xref ref-type="supplementary-material" rid="DS2">Supplementary Table 16</xref>). This study would not only lay a foundation for rapid discovery of genes from weedy rice but also broaden the understanding of weedy rice utilization on rice genetic improvement. Large number of candidate genes were obtained in this study and those excellent gene could improve the breeding value of cultivated rice. Next step studying of the function of the candidate gene can use gene knockout, mutation analysis, overexpression analysis, genetic complementation, and other experiments to further verify whether the candidate gene can be used to improve cultivated rice.</p>
<p>The <italic>Oryza</italic> genus is generally believed to include 22 wild and 2 cultivated rice species based on morphological characteristics (<xref ref-type="bibr" rid="B34">Jacquemin et al., 2014</xref>). Asian cultivated rice (<italic>O. sativa</italic> L.), an important staple crop, is widely planted around the world and has formed extremely rich genetic diversity during the long evolutionary process. In <italic>O. sativa</italic>, the two subspecies (i.e., <italic>indica</italic> and <italic>japonica</italic>) differ in morphology, anatomical structure, physiological and biochemical characteristics, and genome sequence, and their origins remain controversial (<xref ref-type="bibr" rid="B72">Shinobu et al., 2002</xref>; <xref ref-type="bibr" rid="B87">Vaughan et al., 2007</xref>). The single-origin theory believes that <italic>indica</italic> and <italic>japonica</italic> both derived from <italic>O. rufipogon</italic> and diverged during the long-term domestication and artificial selection (<xref ref-type="bibr" rid="B9">Chang, 1976</xref>; <xref ref-type="bibr" rid="B111">Zhu and Ge, 2005</xref>). By contrast, the multi-origin theory believes that <italic>indica</italic> originated from <italic>O. nivara</italic> in eastern India, while <italic>japonica</italic> originated from <italic>O. rufipogon</italic> in the Yangtze River region of China (<xref ref-type="bibr" rid="B62">Oka, 1974</xref>; <xref ref-type="bibr" rid="B50">Londo et al., 2006</xref>; <xref ref-type="bibr" rid="B26">Huang et al., 2012</xref>; <xref ref-type="bibr" rid="B86">Sun et al., 2015</xref>), and the divergence between <italic>indica</italic> and <italic>japonica</italic> subspecies occurred 0.4 Mya (<xref ref-type="bibr" rid="B39">Kumagai et al., 2010</xref>; <xref ref-type="bibr" rid="B10">Chen et al., 2012</xref>). Our phylogenetic analysis showed that <italic>O. nivara</italic> and <italic>O. rufipogon</italic> were present in two separate branches, supporting the evolutionary model of multiple origins. LM8 was originated approximately 0.32 Mya and harbors morphological characteristics specific to wild rice such as shattering, hard glumes, and small grains (<xref ref-type="fig" rid="F5">Figure 5</xref>). Thus, it could be concluded that LM8 is a kind of <italic>japonica</italic>-type weedy rice from a cross between <italic>japonica</italic> and wild rice, which confirmed the result of taxonomic study.</p>
<p>Chromosome-level genome assemblies may generally accelerate gene discovery in crops to improve yield, quality, and disease resistance (<xref ref-type="bibr" rid="B68">Rao et al., 2014</xref>; <xref ref-type="bibr" rid="B67">Qian et al., 2016</xref>; <xref ref-type="bibr" rid="B2">Bai et al., 2018</xref>). As genome assemblies of Asian cultivated rice varieties such as MH63, ZH97, and R498 become available, a large number of structural variations have been successfully obtained, which would have a wide-range impact on crop genetic improvement (<xref ref-type="bibr" rid="B108">Zhang et al., 2016</xref>; <xref ref-type="bibr" rid="B16">Du et al., 2017</xref>). For example, <xref ref-type="bibr" rid="B110">Zhang et al. (2014)</xref> assembled five AA-genome rice species and identified 14 PSGs that are closely related to rice flowering, development, reproduction, biotic and abiotic resistance through comparative genomics analyses. Although many genomes have been assembled in the <italic>Oryza</italic> genus, only one of them belongs to weedy rice (WRAH), which was used to discuss the origin of weedy rice (<xref ref-type="bibr" rid="B84">Sun et al., 2019</xref>). In this study, we reported another weedy rice (LM8) genome for the purpose of identifying genes. This chromosome-level genome assembly contains 672 unique genes specific to weedy rice compared with other 17 <italic>Oryza</italic> genomes (<xref ref-type="fig" rid="F5">Figure 5</xref>). Besides, the comparison of the contig N50 (6.09 Mb in WRAH and 17.86 Mb in LM8) and sequence gaps (94 in WRAH and 25 in LM8; <xref ref-type="table" rid="T1">Table 1</xref>) between these two weedy rice genomes (<xref ref-type="bibr" rid="B84">Sun et al., 2019</xref>) indicates the high-quality LM8 genome assembly is able to serve as a reference for accelerating the identification of genes from weedy rice, thus improving the cultivated rice varieties.</p>
</sec>
<sec id="S5" sec-type="data-availability">
<title>Data Availability Statement</title>
<p>The original contributions presented in the study are publicly available. This data can be found here: National Center for Biotechnology Information (NCBI) BioProject database under accession number <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="PRJNA754271">PRJNA754271</ext-link>.</p>
</sec>
<sec id="S6">
<title>Author Contributions</title>
<p>FL performed the experiments. FL and ZH conducted data analyses and wrote the manuscript. WQ contributed to construct of genetic population and experimental guidance. JW, YS, YCu, JL, JG, DLo, and WF contributed to help data analyses. DLi, BN, ZZ, YCh, and LZ contributed to the material preparation, collection, and measurement. QY and XZ designed the experiment and revised the manuscript. All authors read and approved the final manuscript.</p>
</sec>
<sec sec-type="COI-statement" id="conf1">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="pudiscl1" sec-type="disclaimer">
<title>Publisher&#x2019;s Note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
</body>
<back>
<sec id="S7" sec-type="funding-information">
<title>Funding</title>
<p>This work was supported by the National Natural Science Foundation of China (31970237), the Science and Technology Innovation Project of Chinese Academy of Agricultural Sciences (2060302-2), the Sanya Yazhou Bay Science and Technology City (SKJC-2020-02-001), and the Fundamental Research Funds (S2021ZD01).</p>
</sec>
<ack>
<p>We acknowledge the Anhui Academy of Agricultural Sciences for kindly providing the cultivated rice variety &#x201C;Shen 08S.&#x201D; We appreciate the linguistic assistance provided by TopEdit (<ext-link ext-link-type="uri" xlink:href="http://www.topeditsci.com">www.topeditsci.com</ext-link>) during preparation of this manuscript.</p>
</ack>
<sec id="S9" sec-type="supplementary-material">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fpls.2021.775051/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fpls.2021.775051/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Data_Sheet_1.docx" id="DS1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Data_Sheet_2.docx" id="DS2" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Agarwal</surname> <given-names>G.</given-names></name> <name><surname>Clevenger</surname> <given-names>J.</given-names></name> <name><surname>Pandey</surname> <given-names>M. K.</given-names></name> <name><surname>Wang</surname> <given-names>H.</given-names></name> <name><surname>Shasidhar</surname> <given-names>Y.</given-names></name> <name><surname>Chu</surname> <given-names>Y.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>High-density genetic map using whole-genome re-sequencing for fine mapping and candidate gene discovery for disease resistance in peanut.</article-title> <source><italic>Plant Biotechnol. J.</italic></source> <volume>16</volume> <fpage>1954</fpage>&#x2013;<lpage>1967</lpage>. <pub-id pub-id-type="doi">10.1111/pbi.12930</pub-id> <pub-id pub-id-type="pmid">29637729</pub-id></citation></ref>
<ref id="B2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bai</surname> <given-names>S.</given-names></name> <name><surname>Yu</surname> <given-names>H.</given-names></name> <name><surname>Wang</surname> <given-names>B.</given-names></name> <name><surname>Li</surname> <given-names>J.</given-names></name></person-group> (<year>2018</year>). <article-title>Retrospective and perspective of rice breeding in China.</article-title> <source><italic>J. Genet. Geno.</italic></source> <volume>45</volume> <fpage>603</fpage>&#x2013;<lpage>612</lpage>. <pub-id pub-id-type="doi">10.1016/j.jgg.2018.10.002</pub-id> <pub-id pub-id-type="pmid">30449538</pub-id></citation></ref>
<ref id="B3"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Baker</surname> <given-names>H. G.</given-names></name></person-group> (<year>1974</year>). <article-title>The evolution of weeds.</article-title> <source><italic>Annu. Rev. Ecol. Syst.</italic></source> <volume>5</volume> <fpage>1</fpage>&#x2013;<lpage>24</lpage>. <pub-id pub-id-type="doi">10.1146/annurev.es.05.110174.000245</pub-id></citation></ref>
<ref id="B4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bao</surname> <given-names>W.</given-names></name> <name><surname>Kojima</surname> <given-names>K. K.</given-names></name> <name><surname>Kohany</surname> <given-names>O.</given-names></name></person-group> (<year>2015</year>). <article-title>Repbase update, a database of repetitive elements in eukaryotic genomes.</article-title> <source><italic>Mobile DNA</italic></source> <volume>6</volume>:<fpage>11</fpage>. <pub-id pub-id-type="doi">10.1186/s13100-015-0041-9</pub-id> <pub-id pub-id-type="pmid">26045719</pub-id></citation></ref>
<ref id="B5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Basunia</surname> <given-names>M. A.</given-names></name> <name><surname>Nonhebel</surname> <given-names>H. M.</given-names></name> <name><surname>Backhouse</surname> <given-names>D.</given-names></name> <name><surname>Mcmillan</surname> <given-names>M.</given-names></name></person-group> (<year>2021</year>). <article-title>Localised expression of OsIAA29 suggests a key role for auxin in regulating development of the dorsal aleurone of early rice grains.</article-title> <source><italic>BioRxiv [prperint].</italic></source> <pub-id pub-id-type="doi">10.1007/s00425-021-03688-z</pub-id> <pub-id pub-id-type="pmid">34324072</pub-id></citation></ref>
<ref id="B6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Benson</surname> <given-names>G.</given-names></name></person-group> (<year>1999</year>). <article-title>Tandem repeats finder: a program to analyze DNA sequences.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>27</volume> <fpage>573</fpage>&#x2013;<lpage>580</lpage>. <pub-id pub-id-type="doi">10.1093/nar/27.2.573</pub-id> <pub-id pub-id-type="pmid">9862982</pub-id></citation></ref>
<ref id="B7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Burton</surname> <given-names>J. N.</given-names></name> <name><surname>Adey</surname> <given-names>A.</given-names></name> <name><surname>Patwardhan</surname> <given-names>R. P.</given-names></name> <name><surname>Qiu</surname> <given-names>R.</given-names></name> <name><surname>Kitzman</surname> <given-names>J. O.</given-names></name> <name><surname>Shendure</surname> <given-names>J.</given-names></name></person-group> (<year>2013</year>). <article-title>Chromosome-scale scaffolding of de novo genome assemblies based on chromatin interactions.</article-title> <source><italic>Nat. Biotechnol.</italic></source> <volume>31</volume> <fpage>1119</fpage>&#x2013;<lpage>1125</lpage>. <pub-id pub-id-type="doi">10.1038/nbt.2727</pub-id> <pub-id pub-id-type="pmid">24185095</pub-id></citation></ref>
<ref id="B8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cali</surname> <given-names>D. S.</given-names></name> <name><surname>Kim</surname> <given-names>J. S.</given-names></name> <name><surname>Ghose</surname> <given-names>S.</given-names></name> <name><surname>Alkan</surname> <given-names>C.</given-names></name> <name><surname>Mutlu</surname> <given-names>O.</given-names></name></person-group> (<year>2018</year>). <article-title>Nanopore sequencing technology and tools: computational analysis of the current state, bottlenecks, and future directions.</article-title> <source><italic>Brief. Bioinform.</italic></source> <volume>20</volume> <fpage>1542</fpage>&#x2013;<lpage>1559</lpage>. <pub-id pub-id-type="doi">10.1093/bib/bby017</pub-id> <pub-id pub-id-type="pmid">29617724</pub-id></citation></ref>
<ref id="B9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chang</surname> <given-names>T. T.</given-names></name></person-group> (<year>1976</year>). <article-title>The origin, evolution, cultivation, dissemination, and diversification of Asian and African rices.</article-title> <source><italic>Euphytica</italic></source> <volume>25</volume> <fpage>425</fpage>&#x2013;<lpage>441</lpage>. <pub-id pub-id-type="doi">10.1007/BF00041576</pub-id></citation></ref>
<ref id="B10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>J.</given-names></name> <name><surname>Huang</surname> <given-names>Q.</given-names></name> <name><surname>Gao</surname> <given-names>D.</given-names></name> <name><surname>Wang</surname> <given-names>J.</given-names></name> <name><surname>Lang</surname> <given-names>Y.</given-names></name> <name><surname>Liu</surname> <given-names>T.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>Whole-genome sequencing of <italic>Oryza brachyantha</italic> reveals mechanisms underlying <italic>Oryza genome</italic> evolution.</article-title> <source><italic>Nat. Commun.</italic></source> <volume>4</volume>:<fpage>1595</fpage>. <pub-id pub-id-type="doi">10.1038/ncomms2596</pub-id> <pub-id pub-id-type="pmid">23481403</pub-id></citation></ref>
<ref id="B11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>S.</given-names></name> <name><surname>Zhou</surname> <given-names>Y.</given-names></name> <name><surname>Zhou, Chen</surname> <given-names>Y.</given-names></name> <name><surname>Gu</surname> <given-names>J.</given-names></name></person-group> (<year>2018</year>). <article-title>Fastp: an ultra-fast all-in-one FASTQ preprocessor.</article-title> <source><italic>Bioinformatics</italic></source> <volume>34</volume> <fpage>i884</fpage>&#x2013;<lpage>i890</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/bty560</pub-id> <pub-id pub-id-type="pmid">30423086</pub-id></citation></ref>
<ref id="B12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cho</surname> <given-names>Y.</given-names></name> <name><surname>Chung</surname> <given-names>T.</given-names></name> <name><surname>Suh</surname> <given-names>H.</given-names></name></person-group> (<year>1995</year>). <article-title>Genetic characteristics of Korean weedy rice (<italic>Oryza sativa</italic> L.) by RFLP analysis.</article-title> <source><italic>Euphytica</italic></source> <volume>86</volume> <fpage>103</fpage>&#x2013;<lpage>110</lpage>. <pub-id pub-id-type="doi">10.1007/BF00022015</pub-id></citation></ref>
<ref id="B13"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cui</surname> <given-names>Y.</given-names></name> <name><surname>Song</surname> <given-names>B.</given-names></name> <name><surname>Li</surname> <given-names>L.</given-names></name> <name><surname>Li</surname> <given-names>Y.</given-names></name> <name><surname>Huang</surname> <given-names>Z.</given-names></name> <name><surname>Caicedo</surname> <given-names>A. L.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>Little white lies: pericarp color provides insights into the origins and evolution of Southeast Asian weedy rice.</article-title> <source><italic>G3: Genes Genomes Genet</italic></source> <volume>6</volume> <fpage>4105</fpage>&#x2013;<lpage>4114</lpage>. <pub-id pub-id-type="doi">10.1534/g3.116.035881</pub-id> <pub-id pub-id-type="pmid">27729434</pub-id></citation></ref>
<ref id="B14"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dai</surname> <given-names>L.</given-names></name> <name><surname>Dai</surname> <given-names>W.</given-names></name> <name><surname>Song</surname> <given-names>X.</given-names></name> <name><surname>Lu</surname> <given-names>B.</given-names></name> <name><surname>Qiang</surname> <given-names>S.</given-names></name></person-group> (<year>2013</year>). <article-title>A comparative study of competitiveness between different genotypes of weedy rice (<italic>Oryza sativa</italic>) and cultivated rice.</article-title> <source><italic>Pest Manage. Sci.</italic></source> <volume>70</volume> <fpage>113</fpage>&#x2013;<lpage>122</lpage>. <pub-id pub-id-type="doi">10.1002/ps.3534</pub-id> <pub-id pub-id-type="pmid">23512472</pub-id></citation></ref>
<ref id="B15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>De Bie</surname> <given-names>T.</given-names></name> <name><surname>Cristianini</surname> <given-names>N.</given-names></name> <name><surname>Demuth</surname> <given-names>J. P.</given-names></name> <name><surname>Hahn</surname> <given-names>M. W.</given-names></name></person-group> (<year>2006</year>). <article-title>CAFE: a computational tool for the study of gene family evolution.</article-title> <source><italic>Bioinformatics</italic></source> <volume>22</volume> <fpage>1269</fpage>&#x2013;<lpage>1271</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btl097</pub-id> <pub-id pub-id-type="pmid">16543274</pub-id></citation></ref>
<ref id="B16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Du</surname> <given-names>H.</given-names></name> <name><surname>Yu</surname> <given-names>Y.</given-names></name> <name><surname>Ma</surname> <given-names>Y.</given-names></name> <name><surname>Gao</surname> <given-names>Q.</given-names></name> <name><surname>Cao</surname> <given-names>Y.</given-names></name> <name><surname>Chen</surname> <given-names>Z.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>Sequencing and de novo assembly of a near complete indica rice genome.</article-title> <source><italic>Nat. Commun.</italic></source> <volume>8</volume> <fpage>15324</fpage>&#x2013;<lpage>15336</lpage>. <pub-id pub-id-type="doi">10.1038/ncomms15324</pub-id> <pub-id pub-id-type="pmid">28469237</pub-id></citation></ref>
<ref id="B17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dudchenko</surname> <given-names>O.</given-names></name> <name><surname>Batra</surname> <given-names>S. S.</given-names></name> <name><surname>Omer</surname> <given-names>A. D.</given-names></name> <name><surname>Nyquist</surname> <given-names>S. K.</given-names></name> <name><surname>Hoeger</surname> <given-names>M.</given-names></name> <name><surname>Durand</surname> <given-names>N. C.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>De novo assembly of the <italic>Aedes aegypti</italic> genome using Hi-C yields chromosome-length scaffolds.</article-title> <source><italic>Science</italic></source> <volume>356</volume> <fpage>92</fpage>&#x2013;<lpage>95</lpage>. <pub-id pub-id-type="doi">10.1126/science.aal3327</pub-id> <pub-id pub-id-type="pmid">28336562</pub-id></citation></ref>
<ref id="B18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Fan</surname> <given-names>C.</given-names></name> <name><surname>Xing</surname> <given-names>Y.</given-names></name> <name><surname>Mao</surname> <given-names>H.</given-names></name> <name><surname>Lu</surname> <given-names>T.</given-names></name> <name><surname>Han</surname> <given-names>B.</given-names></name> <name><surname>Xu</surname> <given-names>C.</given-names></name><etal/></person-group> (<year>2006</year>). <article-title>GS3, a major QTL for grain length and weight and minor QTL for grain width and thickness in rice, encodes a putative transmembrane protein.</article-title> <source><italic>Theoretical Appl. Genet.</italic></source> <volume>112</volume> <fpage>1164</fpage>&#x2013;<lpage>1171</lpage>. <pub-id pub-id-type="doi">10.1007/s00122-006-0218-1</pub-id> <pub-id pub-id-type="pmid">16453132</pub-id></citation></ref>
<ref id="B19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Goff</surname> <given-names>S. A.</given-names></name> <name><surname>Ricke</surname> <given-names>D.</given-names></name> <name><surname>Lan</surname> <given-names>T. H.</given-names></name> <name><surname>Presting</surname> <given-names>G.</given-names></name> <name><surname>Wang</surname> <given-names>R.</given-names></name> <name><surname>Dunn</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2002</year>). <article-title>A draft sequence of the rice genome (<italic>Oryza sativa</italic> L. ssp. japonica).</article-title> <source><italic>Science</italic></source> <volume>296</volume> <fpage>92</fpage>&#x2013;<lpage>100</lpage>. <pub-id pub-id-type="doi">10.1126/science.1068275</pub-id> <pub-id pub-id-type="pmid">11935018</pub-id></citation></ref>
<ref id="B20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Griffiths-Jones</surname> <given-names>S.</given-names></name> <name><surname>Moxon</surname> <given-names>S.</given-names></name> <name><surname>Marshall</surname> <given-names>M.</given-names></name> <name><surname>Khanna</surname> <given-names>A.</given-names></name> <name><surname>Eddy</surname> <given-names>S. R.</given-names></name> <name><surname>Bateman</surname> <given-names>A.</given-names></name></person-group> (<year>2005</year>). <article-title>Rfam: annotating non-coding RNAs in complete genomes.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>33</volume> <fpage>D121</fpage>&#x2013;<lpage>D124</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gki081</pub-id> <pub-id pub-id-type="pmid">15608160</pub-id></citation></ref>
<ref id="B21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Haas</surname> <given-names>B. J.</given-names></name> <name><surname>Delcher</surname> <given-names>A. L.</given-names></name> <name><surname>Mount</surname> <given-names>S. M.</given-names></name> <name><surname>Wortman</surname> <given-names>J. R.</given-names></name> <name><surname>Smith</surname> <given-names>J. R. K.</given-names></name> <name><surname>Hannick</surname> <given-names>L. I.</given-names></name><etal/></person-group> (<year>2003</year>). <article-title>Improving the <italic>Arabidopsis</italic> genome annotation using maximal transcript alignment assemblies.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>31</volume> <fpage>5654</fpage>&#x2013;<lpage>5666</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkg770</pub-id> <pub-id pub-id-type="pmid">14500829</pub-id></citation></ref>
<ref id="B22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Haas</surname> <given-names>B. J.</given-names></name> <name><surname>Salzberg</surname> <given-names>S. L.</given-names></name> <name><surname>Zhu</surname> <given-names>W.</given-names></name> <name><surname>Pertea</surname> <given-names>M.</given-names></name> <name><surname>Allen</surname> <given-names>J. E.</given-names></name> <name><surname>Orvis</surname> <given-names>J.</given-names></name><etal/></person-group> (<year>2008</year>). <article-title>Automated eukaryotic gene structure annotation using evidencemodeler and the program to assemble spliced alignments.</article-title> <source><italic>Genome Biol.</italic></source> <volume>9</volume>:<fpage>R7</fpage>. <pub-id pub-id-type="doi">10.1186/gb-2008-9-1-r7</pub-id> <pub-id pub-id-type="pmid">18190707</pub-id></citation></ref>
<ref id="B23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Han</surname> <given-names>B.</given-names></name> <name><surname>Xue</surname> <given-names>Y.</given-names></name> <name><surname>Li</surname> <given-names>J.</given-names></name> <name><surname>Deng</surname> <given-names>X.</given-names></name> <name><surname>Zhang</surname> <given-names>Q.</given-names></name></person-group> (<year>2007</year>). <article-title>Rice functional genomics research in China.</article-title> <source><italic>Philos. Trans. R. Soc. Lond. Ser. B: Biol. Sci.</italic></source> <volume>362</volume> <fpage>1009</fpage>&#x2013;<lpage>1021</lpage>. <pub-id pub-id-type="doi">10.1098/rstb.2007.2030</pub-id> <pub-id pub-id-type="pmid">17347106</pub-id></citation></ref>
<ref id="B24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hu</surname> <given-names>J.</given-names></name> <name><surname>Fan</surname> <given-names>J.</given-names></name> <name><surname>Sun</surname> <given-names>Z.</given-names></name> <name><surname>Liu</surname> <given-names>S.</given-names></name></person-group> (<year>2020</year>). <article-title>NextPolish: a fast and efficient genome polishing tool for long-read assembly.</article-title> <source><italic>Bioinformatics</italic></source> <volume>36</volume> <fpage>2253</fpage>&#x2013;<lpage>2255</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btz891</pub-id> <pub-id pub-id-type="pmid">31778144</pub-id></citation></ref>
<ref id="B25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hu</surname> <given-names>Z.</given-names></name> <name><surname>Deng</surname> <given-names>G.</given-names></name> <name><surname>Mou</surname> <given-names>H.</given-names></name> <name><surname>Xu</surname> <given-names>Y.</given-names></name> <name><surname>Chen</surname> <given-names>L.</given-names></name> <name><surname>Yang</surname> <given-names>J.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>A re-sequencing-based ultra-dense genetic map reveals a gummy stem blight resistance-associated gene in Cucumis melo.</article-title> <source><italic>DNA Res.</italic></source> <volume>225</volume> <fpage>1</fpage>&#x2013;<lpage>10</lpage>. <pub-id pub-id-type="doi">10.1093/dnares/dsx033</pub-id> <pub-id pub-id-type="pmid">28985339</pub-id></citation></ref>
<ref id="B26"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Huang</surname> <given-names>P.</given-names></name> <name><surname>Molina</surname> <given-names>J.</given-names></name> <name><surname>Flowers</surname> <given-names>J. M.</given-names></name> <name><surname>Rubinstein</surname> <given-names>S.</given-names></name> <name><surname>Schaal</surname> <given-names>B. A.</given-names></name> <name><surname>Purugganan</surname> <given-names>M. D.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>Phylogeography of Asian wild rice, <italic>Oryza rufipogon</italic>: a genome-wide view.</article-title> <source><italic>Mol. Ecol.</italic></source> <volume>21</volume> <fpage>4593</fpage>&#x2013;<lpage>4604</lpage>. <pub-id pub-id-type="doi">10.1111/j.1365-294X.2012.05625.x</pub-id> <pub-id pub-id-type="pmid">22646149</pub-id></citation></ref>
<ref id="B27"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Huang</surname> <given-names>X.</given-names></name> <name><surname>Qian</surname> <given-names>Q.</given-names></name> <name><surname>Liu</surname> <given-names>Z.</given-names></name> <name><surname>Sun</surname> <given-names>H.</given-names></name> <name><surname>He</surname> <given-names>S.</given-names></name> <name><surname>Luo</surname> <given-names>D.</given-names></name><etal/></person-group> (<year>2009</year>). <article-title>Natural variation at the DEP1 locus enhances grain yield in rice.</article-title> <source><italic>Nat. Genet.</italic></source> <volume>41</volume> <fpage>494</fpage>&#x2013;<lpage>497</lpage>. <pub-id pub-id-type="doi">10.1038/ng.352</pub-id> <pub-id pub-id-type="pmid">19305410</pub-id></citation></ref>
<ref id="B28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Huang</surname> <given-names>X.</given-names></name> <name><surname>Wei</surname> <given-names>X.</given-names></name> <name><surname>Sang</surname> <given-names>T.</given-names></name> <name><surname>Zhao</surname> <given-names>Q.</given-names></name> <name><surname>Feng</surname> <given-names>Q.</given-names></name> <name><surname>Zhao</surname> <given-names>Y.</given-names></name><etal/></person-group> (<year>2010</year>). <article-title>Genome-wide association studies of 14 agronomic traits in rice landraces.</article-title> <source><italic>Nat. Genet.</italic></source> <volume>42</volume> <fpage>961</fpage>&#x2013;<lpage>967</lpage>. <pub-id pub-id-type="doi">10.1038/ng.695</pub-id> <pub-id pub-id-type="pmid">20972439</pub-id></citation></ref>
<ref id="B29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Huang</surname> <given-names>X.</given-names></name> <name><surname>Yang</surname> <given-names>S.</given-names></name> <name><surname>Gong</surname> <given-names>J.</given-names></name> <name><surname>Zhao</surname> <given-names>Y.</given-names></name> <name><surname>Feng</surname> <given-names>Q.</given-names></name> <name><surname>Gong</surname> <given-names>H.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>Genomic analysis of hybrid rice varieties reveals numerous superior alleles that contribute to heterosis.</article-title> <source><italic>Nat. Commun.</italic></source> <volume>6</volume> <fpage>6258</fpage>&#x2013;<lpage>6267</lpage>. <pub-id pub-id-type="doi">10.1038/ncomms7258</pub-id> <pub-id pub-id-type="pmid">25651972</pub-id></citation></ref>
<ref id="B30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Huang</surname> <given-names>X.</given-names></name> <name><surname>Zhao</surname> <given-names>Y.</given-names></name> <name><surname>Wei</surname> <given-names>X.</given-names></name> <name><surname>Li</surname> <given-names>C.</given-names></name> <name><surname>Wang</surname> <given-names>A.</given-names></name> <name><surname>Zhao</surname> <given-names>Q.</given-names></name><etal/></person-group> (<year>2011</year>). <article-title>Genome-wide association study of filowering time and grain yield traits in a worldwide collectionof rice germplasm.</article-title> <source><italic>Nat. Genet.</italic></source> <volume>44</volume> <fpage>32</fpage>&#x2013;<lpage>39</lpage>. <pub-id pub-id-type="doi">10.1038/ng.1018</pub-id> <pub-id pub-id-type="pmid">22138690</pub-id></citation></ref>
<ref id="B31"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hunter</surname> <given-names>S.</given-names></name> <name><surname>Apweiler</surname> <given-names>R.</given-names></name> <name><surname>Attwood</surname> <given-names>T. K.</given-names></name> <name><surname>Bairoch</surname> <given-names>A.</given-names></name> <name><surname>Bateman</surname> <given-names>A.</given-names></name> <name><surname>Binns</surname> <given-names>D.</given-names></name><etal/></person-group> (<year>2009</year>). <article-title>InterPro: the integrative protein signature database.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>37</volume> <fpage>D211</fpage>&#x2013;<lpage>D215</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkn785</pub-id> <pub-id pub-id-type="pmid">18940856</pub-id></citation></ref>
<ref id="B32"><citation citation-type="journal"><collab>International Wheat Genome Sequencing Consortium [IWGSC]</collab> (<year>2014</year>). <article-title>A chromosome-based draft sequence of the hexaploid bread wheat (<italic>Triticum aestivum</italic>) genome.</article-title> <source><italic>Science</italic></source> <volume>345</volume>:<fpage>1251788</fpage>. <pub-id pub-id-type="doi">10.1126/science.1251788</pub-id> <pub-id pub-id-type="pmid">25035500</pub-id></citation></ref>
<ref id="B33"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ishikawa</surname> <given-names>R.</given-names></name> <name><surname>Toki</surname> <given-names>N.</given-names></name> <name><surname>Imai</surname> <given-names>K.</given-names></name> <name><surname>Sato</surname> <given-names>Y. I.</given-names></name> <name><surname>Yamagishi</surname> <given-names>H.</given-names></name> <name><surname>Shimamoto</surname> <given-names>Y.</given-names></name><etal/></person-group> (<year>2005</year>). <article-title>Origin of weedy rice grown in bhutan and the force of genetic diversity.</article-title> <source><italic>Genet. Resour. Crop Evol.</italic></source> <volume>52</volume> <fpage>395</fpage>&#x2013;<lpage>403</lpage>. <pub-id pub-id-type="doi">10.1007/s10722-005-2257-x</pub-id></citation></ref>
<ref id="B34"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jacquemin</surname> <given-names>J.</given-names></name> <name><surname>Ammiraju</surname> <given-names>J. S. S.</given-names></name> <name><surname>Haberer</surname> <given-names>G.</given-names></name> <name><surname>Billheimer</surname> <given-names>D. D.</given-names></name> <name><surname>Yu</surname> <given-names>Y.</given-names></name> <name><surname>Liu</surname> <given-names>L. C.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>Fifteen million years of evolution in the <italic>Oryza genus</italic> shows extensive gene family expansion.</article-title> <source><italic>Mol. Plant</italic></source> <volume>7</volume> <fpage>642</fpage>&#x2013;<lpage>656</lpage>. <pub-id pub-id-type="doi">10.1093/mp/sst149</pub-id> <pub-id pub-id-type="pmid">24214894</pub-id></citation></ref>
<ref id="B35"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jens</surname> <given-names>K.</given-names></name> <name><surname>Michael</surname> <given-names>W.</given-names></name> <name><surname>Jessica</surname> <given-names>E.</given-names></name> <name><surname>Martin</surname> <given-names>H. S.</given-names></name> <name><surname>Jan</surname> <given-names>G.</given-names></name> <name><surname>Frank</surname> <given-names>H.</given-names></name></person-group> (<year>2016</year>). <article-title>Using intron position conservation for homology-based gene prediction.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>44</volume>:<fpage>e89</fpage>. <pub-id pub-id-type="doi">10.1093/nar/gkw092</pub-id> <pub-id pub-id-type="pmid">26893356</pub-id></citation></ref>
<ref id="B36"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Katoh</surname> <given-names>K.</given-names></name> <name><surname>Standley</surname> <given-names>D. M.</given-names></name></person-group> (<year>2013</year>). <article-title>MAFFT multiple sequence alignment software version 7: improvements in performance and usability.</article-title> <source><italic>Mol. Biol. Evol.</italic></source> <volume>30</volume> <fpage>772</fpage>&#x2013;<lpage>780</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/mst010</pub-id> <pub-id pub-id-type="pmid">23329690</pub-id></citation></ref>
<ref id="B37"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Khush</surname> <given-names>G. S.</given-names></name></person-group> (<year>2001</year>). <article-title>Green revolution: the way forward.</article-title> <source><italic>Nat. Rev. Genet.</italic></source> <volume>2</volume> <fpage>815</fpage>&#x2013;<lpage>822</lpage>. <pub-id pub-id-type="doi">10.1038/35093585</pub-id> <pub-id pub-id-type="pmid">11584298</pub-id></citation></ref>
<ref id="B38"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Koren</surname> <given-names>S.</given-names></name> <name><surname>Walenz</surname> <given-names>B. P.</given-names></name> <name><surname>Berlin</surname> <given-names>K.</given-names></name> <name><surname>Miller</surname> <given-names>J. R.</given-names></name> <name><surname>Bergman</surname> <given-names>N. H.</given-names></name> <name><surname>Phillippy</surname> <given-names>A. M.</given-names></name></person-group> (<year>2017</year>). <article-title>Canu: scalable and accurate long-read assembly via adaptive k-mer weighting and repeat separation.</article-title> <source><italic>Genome Res.</italic></source> <volume>27</volume> <fpage>722</fpage>&#x2013;<lpage>736</lpage>. <pub-id pub-id-type="doi">10.1101/gr.215087.116</pub-id> <pub-id pub-id-type="pmid">28298431</pub-id></citation></ref>
<ref id="B39"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kumagai</surname> <given-names>M.</given-names></name> <name><surname>Wang</surname> <given-names>L.</given-names></name> <name><surname>Ueda</surname> <given-names>S.</given-names></name></person-group> (<year>2010</year>). <article-title>Genetic diversity and evolutionary relationships in genus Oryza revealed by using highly variable regions of chloroplast DNA.</article-title> <source><italic>Gene</italic></source> <volume>462</volume> <fpage>44</fpage>&#x2013;<lpage>51</lpage>. <pub-id pub-id-type="doi">10.1016/j.gene.2010.04.013</pub-id> <pub-id pub-id-type="pmid">20450965</pub-id></citation></ref>
<ref id="B40"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Langfelder</surname> <given-names>P.</given-names></name> <name><surname>Horvath</surname> <given-names>S.</given-names></name></person-group> (<year>2012</year>). <article-title>Fast R functions for robust correlations and hierarchical clustering.</article-title> <source><italic>J. Stat. Softw.</italic></source> <volume>46</volume>:<fpage>i11</fpage>. <pub-id pub-id-type="doi">10.18637/jss.v046.i11</pub-id></citation></ref>
<ref id="B41"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Langmead</surname> <given-names>B.</given-names></name> <name><surname>Salzberg</surname> <given-names>S. L.</given-names></name></person-group> (<year>2012</year>). <article-title>Fast gapped-read alignment with bowtie 2.</article-title> <source><italic>Nat. Methods</italic></source> <volume>9</volume> <fpage>357</fpage>&#x2013;<lpage>359</lpage>. <pub-id pub-id-type="doi">10.1038/nmeth.1923</pub-id> <pub-id pub-id-type="pmid">22388286</pub-id></citation></ref>
<ref id="B42"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>H.</given-names></name> <name><surname>Durbin</surname> <given-names>R.</given-names></name></person-group> (<year>2009</year>). <article-title>Fast and accurate short read alignment with Burrows&#x2013;Wheeler transform.</article-title> <source><italic>Bioinformatics</italic></source> <volume>25</volume> <fpage>1754</fpage>&#x2013;<lpage>1760</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btp324</pub-id> <pub-id pub-id-type="pmid">19451168</pub-id></citation></ref>
<ref id="B43"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>H.</given-names></name> <name><surname>Handsaker</surname> <given-names>B.</given-names></name> <name><surname>Wysoker</surname> <given-names>A.</given-names></name> <name><surname>Fennell</surname> <given-names>T.</given-names></name> <name><surname>Ruan</surname> <given-names>J.</given-names></name> <name><surname>Homer</surname> <given-names>N.</given-names></name><etal/></person-group> (<year>2009</year>). <article-title>The sequence alignment/map format and SAMtools.</article-title> <source><italic>Bioinformatics</italic></source> <volume>25</volume> <fpage>2078</fpage>&#x2013;<lpage>2079</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btp352</pub-id> <pub-id pub-id-type="pmid">19505943</pub-id></citation></ref>
<ref id="B44"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>L.</given-names></name> <name><surname>Stoeckert</surname> <given-names>C. J.</given-names> <suffix>Jr.</suffix></name> <name><surname>Roots</surname> <given-names>D. S.</given-names></name></person-group> (<year>2003</year>). <article-title>OrthoMCL: identification of ortholog groups for eukaryotic genomes.</article-title> <source><italic>Genome Res.</italic></source> <volume>13</volume> <fpage>2178</fpage>&#x2013;<lpage>2189</lpage>. <pub-id pub-id-type="doi">10.1101/gr.1224503</pub-id> <pub-id pub-id-type="pmid">12952885</pub-id></citation></ref>
<ref id="B45"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>X.</given-names></name> <name><surname>Singh</surname> <given-names>J.</given-names></name> <name><surname>Qin</surname> <given-names>M.</given-names></name> <name><surname>Li</surname> <given-names>S.</given-names></name> <name><surname>Zhang</surname> <given-names>X.</given-names></name> <name><surname>Zhang</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>Development of an integrated 200K SNP genotyping array and application for genetic mapping, genome assembly improvement and genome wide association studies in pear (Pyrus).</article-title> <source><italic>Plant Biotechnol. J.</italic></source> <volume>17</volume> <fpage>1582</fpage>&#x2013;<lpage>1594</lpage>. <pub-id pub-id-type="doi">10.1111/pbi.13085</pub-id> <pub-id pub-id-type="pmid">30690857</pub-id></citation></ref>
<ref id="B46"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>X.</given-names></name> <name><surname>Wu</surname> <given-names>L.</given-names></name> <name><surname>Wang</surname> <given-names>J.</given-names></name> <name><surname>Sun</surname> <given-names>J.</given-names></name> <name><surname>Xia</surname> <given-names>X.</given-names></name> <name><surname>Geng</surname> <given-names>X.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>Genome sequencing of rice subspecies and genetic analysis of recombinant lines reveals regional yield- and quality-associated loci.</article-title> <source><italic>BMC Biol.</italic></source> <volume>16</volume>:<fpage>102</fpage>. <pub-id pub-id-type="doi">10.1186/s12915-018-0572-x</pub-id> <pub-id pub-id-type="pmid">30227868</pub-id></citation></ref>
<ref id="B47"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>Y.</given-names></name> <name><surname>Fan</surname> <given-names>C.</given-names></name> <name><surname>Xing</surname> <given-names>Y.</given-names></name> <name><surname>Jiang</surname> <given-names>Y.</given-names></name> <name><surname>Luo</surname> <given-names>L.</given-names></name> <name><surname>Sun</surname> <given-names>L.</given-names></name><etal/></person-group> (<year>2011</year>). <article-title>Natural variation in GS5 plays an important role in regulating grain size and yield in rice.</article-title> <source><italic>Nat. Genet.</italic></source> <volume>43</volume> <fpage>1266</fpage>&#x2013;<lpage>1269</lpage>. <pub-id pub-id-type="doi">10.1038/ng.977</pub-id> <pub-id pub-id-type="pmid">22019783</pub-id></citation></ref>
<ref id="B48"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname> <given-names>B.</given-names></name> <name><surname>Shi</surname> <given-names>Y.</given-names></name> <name><surname>Yuan</surname> <given-names>J.</given-names></name> <name><surname>Hu</surname> <given-names>X.</given-names></name> <name><surname>Zhang</surname> <given-names>H.</given-names></name> <name><surname>Li</surname> <given-names>N.</given-names></name><etal/></person-group> (<year>2013</year>). <article-title>Estimation of genomic characteristics by analyzing k-mer frequency in de novo genome projects.</article-title> <source><italic>Quant. Biol.</italic></source> <volume>35</volume> <fpage>62</fpage>&#x2013;<lpage>67</lpage>. <pub-id pub-id-type="doi">10.1016/S0925-4005(96)02015-1</pub-id></citation></ref>
<ref id="B49"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Loman</surname> <given-names>N. J.</given-names></name> <name><surname>Quick</surname> <given-names>J.</given-names></name> <name><surname>Simpson</surname> <given-names>J. T.</given-names></name></person-group> (<year>2015</year>). <article-title>A complete bacterial genome assembled de novo using only nanopore sequencing data.</article-title> <source><italic>Nat. Methods</italic></source> <volume>12</volume> <fpage>733</fpage>&#x2013;<lpage>735</lpage>. <pub-id pub-id-type="doi">10.1038/nmeth.3444</pub-id> <pub-id pub-id-type="pmid">26076426</pub-id></citation></ref>
<ref id="B50"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Londo</surname> <given-names>J. P.</given-names></name> <name><surname>Chiang</surname> <given-names>Y.</given-names></name> <name><surname>Hung</surname> <given-names>K.</given-names></name> <name><surname>Chiang</surname> <given-names>T. Y.</given-names></name> <name><surname>Schaal</surname> <given-names>B. A.</given-names></name></person-group> (<year>2006</year>). <article-title>Phylogeography of Asian wild rice, <italic>Oryza rufipogon</italic>, reveals multiple independent domestications of cultivated rice, <italic>Oryza sativa</italic>.</article-title> <source><italic>Proc. Natl. Acad. Sci. U S A.</italic></source> <volume>103</volume> <fpage>9578</fpage>&#x2013;<lpage>9583</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.0603152103</pub-id> <pub-id pub-id-type="pmid">16766658</pub-id></citation></ref>
<ref id="B51"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lowe</surname> <given-names>T. M.</given-names></name> <name><surname>Eddy</surname> <given-names>S. R.</given-names></name></person-group> (<year>1997</year>). <article-title>tRNAscan-SE: a program for improved detection of transfer RNA genes in genomic sequence.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>25</volume> <fpage>955</fpage>&#x2013;<lpage>964</lpage>. <pub-id pub-id-type="doi">10.1093/nar/25.5.955</pub-id> <pub-id pub-id-type="pmid">9023104</pub-id></citation></ref>
<ref id="B52"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lu</surname> <given-names>B.</given-names></name> <name><surname>Narede</surname> <given-names>M. E. B.</given-names></name> <name><surname>Juliano</surname> <given-names>A. B.</given-names></name> <name><surname>Jackson</surname> <given-names>M. T.</given-names></name></person-group> (<year>2000</year>). <source><italic>Preliminary Studies on Taxonomy and Biosystematics of the AA Genome Oryza species (Poaceae).</italic></source> <publisher-loc>Clayton, CSU</publisher-loc>: <publisher-name>CSIRO Publishing</publisher-name>.</citation></ref>
<ref id="B53"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Luo</surname> <given-names>J.</given-names></name> <name><surname>Liu</surname> <given-names>H.</given-names></name> <name><surname>Zhou</surname> <given-names>T.</given-names></name> <name><surname>Gu</surname> <given-names>B.</given-names></name> <name><surname>Huang</surname> <given-names>X.</given-names></name> <name><surname>Shangguan</surname> <given-names>Y.</given-names></name><etal/></person-group> (<year>2013</year>). <article-title>An-1 encodes a basic helix-loop-helix protein that regulates awn development, grain size, and grain number in rice.</article-title> <source><italic>Plant Cell</italic></source> <volume>25</volume> <fpage>3360</fpage>&#x2013;<lpage>3376</lpage>. <pub-id pub-id-type="doi">10.1105/tpc.113.113589</pub-id> <pub-id pub-id-type="pmid">24076974</pub-id></citation></ref>
<ref id="B54"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Luo</surname> <given-names>X.</given-names></name> <name><surname>Xu</surname> <given-names>L.</given-names></name> <name><surname>Wang</surname> <given-names>Y.</given-names></name> <name><surname>Dong</surname> <given-names>J.</given-names></name> <name><surname>Chen</surname> <given-names>Y.</given-names></name> <name><surname>Tang</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2020</year>). <article-title>An ultra-high-density genetic map provides insights into genome synteny, recombination landscape and taproot skin colour in radish (<italic>Raphanus sativus</italic> L.).</article-title> <source><italic>Plant Biotechnol. J.</italic></source> <volume>18</volume> <fpage>274</fpage>&#x2013;<lpage>286</lpage>. <pub-id pub-id-type="doi">10.1111/pbi.13195</pub-id> <pub-id pub-id-type="pmid">31218798</pub-id></citation></ref>
<ref id="B55"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ma</surname> <given-names>X.</given-names></name> <name><surname>Fu</surname> <given-names>Y.</given-names></name> <name><surname>Zhao</surname> <given-names>X.</given-names></name> <name><surname>Jiang</surname> <given-names>L.</given-names></name> <name><surname>Zhu</surname> <given-names>Z.</given-names></name> <name><surname>Gu</surname> <given-names>P.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>Genomic structure analysis of a set of <italic>Oryza nivara</italic> introgression lines and identification of yield-associated QTLs using whole-genome resequencing.</article-title> <source><italic>Sci. Rep.</italic></source> <volume>6</volume> <fpage>27425</fpage>&#x2013;<lpage>27437</lpage>. <pub-id pub-id-type="doi">10.1038/srep27425</pub-id> <pub-id pub-id-type="pmid">27251022</pub-id></citation></ref>
<ref id="B56"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mao</surname> <given-names>H.</given-names></name> <name><surname>Sun</surname> <given-names>S.</given-names></name> <name><surname>Yao</surname> <given-names>J.</given-names></name> <name><surname>Wang</surname> <given-names>C.</given-names></name> <name><surname>Yu</surname> <given-names>S.</given-names></name> <name><surname>Xu</surname> <given-names>C.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>Linking differential domain functions of the GS3 protein to natural variation of grain size in rice.</article-title> <source><italic>PNAS.</italic></source> <volume>107</volume> <fpage>19579</fpage>&#x2013;<lpage>19584</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1014419107</pub-id> <pub-id pub-id-type="pmid">20974950</pub-id></citation></ref>
<ref id="B57"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mar&#x00E7;ais</surname> <given-names>G.</given-names></name> <name><surname>Kingsford</surname> <given-names>C.</given-names></name></person-group> (<year>2011</year>). <article-title>A fast, lock-free approach for efficient parallel counting of occurrences of k-mers.</article-title> <source><italic>Bioinformatics</italic></source> <volume>27</volume> <fpage>764</fpage>&#x2013;<lpage>770</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btr011</pub-id> <pub-id pub-id-type="pmid">21217122</pub-id></citation></ref>
<ref id="B58"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>McKenna</surname> <given-names>A.</given-names></name> <name><surname>Hanna</surname> <given-names>M.</given-names></name> <name><surname>Banks</surname> <given-names>E.</given-names></name> <name><surname>Sivachenko</surname> <given-names>A.</given-names></name> <name><surname>Cibulskis</surname> <given-names>K.</given-names></name> <name><surname>Kernytsky</surname> <given-names>A.</given-names></name><etal/></person-group> (<year>2010</year>). <article-title>The genome analysis toolkit: a mapreduce framework for analyzing next-generation DNA sequencing data.</article-title> <source><italic>Genome Res.</italic></source> <volume>20</volume> <fpage>1297</fpage>&#x2013;<lpage>1303</lpage>. <pub-id pub-id-type="doi">10.1101/gr.107524.110</pub-id> <pub-id pub-id-type="pmid">20644199</pub-id></citation></ref>
<ref id="B59"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mostovoy</surname> <given-names>Y.</given-names></name> <name><surname>Levy-Sakin</surname> <given-names>M.</given-names></name> <name><surname>Lam</surname> <given-names>J.</given-names></name> <name><surname>Lam</surname> <given-names>E. T.</given-names></name> <name><surname>Hastie</surname> <given-names>A. R.</given-names></name> <name><surname>Marks</surname> <given-names>P.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>A hybrid approach for de novo human genome sequence assembly and phasing.</article-title> <source><italic>Nat. Methods</italic></source> <volume>13</volume> <fpage>587</fpage>&#x2013;<lpage>590</lpage>. <pub-id pub-id-type="doi">10.1038/nmeth.3865</pub-id> <pub-id pub-id-type="pmid">27159086</pub-id></citation></ref>
<ref id="B60"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nadir</surname> <given-names>S.</given-names></name> <name><surname>Khan</surname> <given-names>S.</given-names></name> <name><surname>Zhu</surname> <given-names>Q.</given-names></name> <name><surname>Henry</surname> <given-names>D.</given-names></name> <name><surname>Wei</surname> <given-names>L.</given-names></name> <name><surname>Lee</surname> <given-names>D. S.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>An overview on reproductive isolation in <italic>Oryza sativa</italic> complex.</article-title> <source><italic>AOB Plants</italic></source> <volume>10</volume> <fpage>60</fpage>&#x2013;<lpage>73</lpage>. <pub-id pub-id-type="doi">10.1093/aobpla/ply060</pub-id> <pub-id pub-id-type="pmid">30538811</pub-id></citation></ref>
<ref id="B61"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nikolau</surname> <given-names>B. J.</given-names></name> <name><surname>Ohlrogge</surname> <given-names>J. B.</given-names></name> <name><surname>Wurtele</surname> <given-names>E. S.</given-names></name></person-group> (<year>2003</year>). <article-title>Plant biotin-containing carboxylases.</article-title> <source><italic>Arch. Biochem. Biophys.</italic></source> <volume>414</volume> <fpage>211</fpage>&#x2013;<lpage>222</lpage>. <pub-id pub-id-type="doi">10.1016/S0003-9861(03)00156-5</pub-id></citation></ref>
<ref id="B62"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Oka</surname> <given-names>H. I.</given-names></name></person-group> (<year>1974</year>). <article-title>Experimental studies on the origin of cultivated rice.</article-title> <source><italic>Genetics</italic></source> <volume>78</volume> <fpage>475</fpage>&#x2013;<lpage>486</lpage>. <pub-id pub-id-type="doi">10.1093/genetics/78.1.475</pub-id> <pub-id pub-id-type="pmid">17248664</pub-id></citation></ref>
<ref id="B63"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ooijen</surname> <given-names>J. V.</given-names></name> <name><surname>Ooijen</surname> <given-names>J. W. V.</given-names></name> <name><surname>Ooijen</surname> <given-names>J.</given-names></name> <name><surname>Hoorn</surname> <given-names>J.</given-names></name> <name><surname>Duin</surname> <given-names>J.</given-names></name> <name><surname>Verlaat</surname> <given-names>J. V. T.</given-names></name></person-group> (<year>2009</year>). <source><italic>MapQTL<sup>&#x00AE;</sup>6. Software for the Mapping of Quantitative Trait Loci in Experimental Populations of Diploid Species.</italic></source> <publisher-loc>Wageningen</publisher-loc>: <publisher-name>Kyazma BV</publisher-name>.</citation></ref>
<ref id="B64"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Peng</surname> <given-names>X.</given-names></name> <name><surname>Liu</surname> <given-names>H.</given-names></name> <name><surname>Chen</surname> <given-names>P.</given-names></name> <name><surname>Tang</surname> <given-names>F.</given-names></name> <name><surname>Hu</surname> <given-names>Y.</given-names></name> <name><surname>Wang</surname> <given-names>F.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>A chromosome-scale genome assembly of paper mulberry (<italic>Broussonetia papyrifera</italic>) provides new insights into its forage and papermaking usage.</article-title> <source><italic>Mol. Plant</italic></source> <volume>12</volume> <fpage>661</fpage>&#x2013;<lpage>677</lpage>. <pub-id pub-id-type="doi">10.1016/j.molp.2019.01.021</pub-id> <pub-id pub-id-type="pmid">30822525</pub-id></citation></ref>
<ref id="B65"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Puttick</surname> <given-names>M. N.</given-names></name></person-group> (<year>2019</year>). <article-title>MCMCtreeR: functions to prepare MCMCtree analyses and visualize posterior ages on trees.</article-title> <source><italic>Bioinformatics</italic></source> <volume>35</volume> <fpage>5321</fpage>&#x2013;<lpage>5322</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btz554</pub-id> <pub-id pub-id-type="pmid">31292621</pub-id></citation></ref>
<ref id="B66"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Qi</surname> <given-names>P.</given-names></name> <name><surname>Lin</surname> <given-names>Y. S.</given-names></name> <name><surname>Song</surname> <given-names>X. J.</given-names></name> <name><surname>Shen</surname> <given-names>J. B.</given-names></name> <name><surname>Huang</surname> <given-names>W.</given-names></name> <name><surname>Shan</surname> <given-names>J. X.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>The novel quantitative trait locus GL3.1 controls rice grain size and yield by regulating Cyclin-T1;3.</article-title> <source><italic>Cell Res.</italic></source> <volume>22</volume> <fpage>1666</fpage>&#x2013;<lpage>1680</lpage>. <pub-id pub-id-type="doi">10.1038/cr.2012.151</pub-id> <pub-id pub-id-type="pmid">23147796</pub-id></citation></ref>
<ref id="B67"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Qian</surname> <given-names>Q.</given-names></name> <name><surname>Guo</surname> <given-names>L.</given-names></name> <name><surname>Smith</surname> <given-names>S. M.</given-names></name> <name><surname>Li</surname> <given-names>J.</given-names></name></person-group> (<year>2016</year>). <article-title>Breeding high-yield superior quality hybrid super rice by rational design.</article-title> <source><italic>Natl. Sci. Rev.</italic></source> <volume>3</volume> <fpage>283</fpage>&#x2013;<lpage>294</lpage>. <pub-id pub-id-type="doi">10.1093/nsr/nww006</pub-id></citation></ref>
<ref id="B68"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rao</surname> <given-names>Y.</given-names></name> <name><surname>Li</surname> <given-names>Y.</given-names></name> <name><surname>Qian</surname> <given-names>Q.</given-names></name></person-group> (<year>2014</year>). <article-title>Recent progress on molecular breeding of rice in China.</article-title> <source><italic>Plant Cell Rep.</italic></source> <volume>33</volume> <fpage>551</fpage>&#x2013;<lpage>564</lpage>. <pub-id pub-id-type="doi">10.1007/s00299-013-1551-x</pub-id> <pub-id pub-id-type="pmid">24442397</pub-id></citation></ref>
<ref id="B69"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Reisner</surname> <given-names>W.</given-names></name> <name><surname>Larsen</surname> <given-names>R. B.</given-names></name> <name><surname>Silahtaroglu</surname> <given-names>R.</given-names></name> <name><surname>Kristensen</surname> <given-names>R.</given-names></name> <name><surname>Tommerup</surname> <given-names>N.</given-names></name> <name><surname>Tegenfeldt</surname> <given-names>R. O.</given-names></name><etal/></person-group> (<year>2010</year>). <article-title>Single-molecule denaturation mapping of DNA in nanofluidic channels.</article-title> <source><italic>PNAS.</italic></source> <volume>107</volume> <fpage>13294</fpage>&#x2013;<lpage>13299</lpage>. <pub-id pub-id-type="doi">10.2307/25708710</pub-id></citation></ref>
<ref id="B70"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Schnable</surname> <given-names>P. S.</given-names></name> <name><surname>Ware</surname> <given-names>D.</given-names></name> <name><surname>Fulton</surname> <given-names>R. S.</given-names></name> <name><surname>Stein</surname> <given-names>J. C.</given-names></name> <name><surname>Wei</surname> <given-names>F.</given-names></name> <name><surname>Pasternak</surname> <given-names>S.</given-names></name><etal/></person-group> (<year>2009</year>). <article-title>The B73 maize genome: complexity, diversity, and dynamics.</article-title> <source><italic>Science</italic></source> <volume>326</volume> <fpage>1112</fpage>&#x2013;<lpage>1115</lpage>. <pub-id pub-id-type="doi">10.1126/science.1178534</pub-id> <pub-id pub-id-type="pmid">19965430</pub-id></citation></ref>
<ref id="B71"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sharma</surname> <given-names>B.</given-names></name> <name><surname>Taganna</surname> <given-names>J.</given-names></name></person-group> (<year>2020</year>). <article-title>Genome-wide analysis of the U-box E3 ubiquitin ligase enzyme gene family in tomato.</article-title> <source><italic>Sci. Rep.</italic></source> <volume>10</volume>:<fpage>9581</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-020-66553-1</pub-id> <pub-id pub-id-type="pmid">32533036</pub-id></citation></ref>
<ref id="B72"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shinobu</surname> <given-names>N.</given-names></name> <name><surname>Junko</surname> <given-names>S.</given-names></name> <name><surname>Rieko</surname> <given-names>O.</given-names></name> <name><surname>Kana</surname> <given-names>H.</given-names></name> <name><surname>Rika</surname> <given-names>Y.</given-names></name> <name><surname>Noriyuki</surname> <given-names>K.</given-names></name><etal/></person-group> (<year>2002</year>). <article-title>Search for and analysis of single nucleotide polymorphisms (SNPs) in rice (<italic>Oryza sativa</italic>, <italic>Oryza rufipogon</italic>) and establishment of SNP markers.</article-title> <source><italic>DNA Res.</italic></source> <volume>9</volume> <fpage>163</fpage>&#x2013;<lpage>171</lpage>. <pub-id pub-id-type="doi">10.1093/dnares/9.5.163</pub-id> <pub-id pub-id-type="pmid">12465716</pub-id></citation></ref>
<ref id="B73"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shivrain</surname> <given-names>V. K.</given-names></name> <name><surname>Burgos</surname> <given-names>N. R.</given-names></name> <name><surname>Sales</surname> <given-names>M. A.</given-names></name> <name><surname>Yong</surname> <given-names>Y. I.</given-names></name></person-group> (<year>2010</year>). <article-title>Polymorphisms in the ALS gene of weedy rice (<italic>Oryza sativa</italic> L.) accessions with differential tolerance to imazethapyr.</article-title> <source><italic>Crop Protect.</italic></source> <volume>29</volume> <fpage>336</fpage>&#x2013;<lpage>341</lpage>. <pub-id pub-id-type="doi">10.1016/j.cropro.2009.10.002</pub-id></citation></ref>
<ref id="B74"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shomura</surname> <given-names>A.</given-names></name> <name><surname>Izawa</surname> <given-names>T.</given-names></name> <name><surname>Ebana</surname> <given-names>K.</given-names></name> <name><surname>Ebitani</surname> <given-names>T.</given-names></name> <name><surname>Kanegae</surname> <given-names>H.</given-names></name> <name><surname>Konishi</surname> <given-names>S.</given-names></name><etal/></person-group> (<year>2008</year>). <article-title>Deletion in a gene associated with grain size increased yields during rice domestication.</article-title> <source><italic>Nat. Genet.</italic></source> <volume>40</volume> <fpage>1023</fpage>&#x2013;<lpage>1028</lpage>. <pub-id pub-id-type="doi">10.1038/ng.169</pub-id> <pub-id pub-id-type="pmid">18604208</pub-id></citation></ref>
<ref id="B75"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sim&#x00E3;o</surname> <given-names>F. A.</given-names></name> <name><surname>Waterhouse</surname> <given-names>R. M.</given-names></name> <name><surname>Panagiotis</surname> <given-names>I.</given-names></name> <name><surname>Kriventseva</surname> <given-names>E. V.</given-names></name> <name><surname>Zdobnov</surname> <given-names>E. M.</given-names></name></person-group> (<year>2015</year>). <article-title>BUSCO: assessing genome assembly and annotation completeness with single-copy orthologs.</article-title> <source><italic>Bioinformatics</italic></source> <volume>31</volume> <fpage>3210</fpage>&#x2013;<lpage>3212</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btv351</pub-id> <pub-id pub-id-type="pmid">26059717</pub-id></citation></ref>
<ref id="B76"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Song</surname> <given-names>X.</given-names></name> <name><surname>Huang</surname> <given-names>W.</given-names></name> <name><surname>Shi</surname> <given-names>M.</given-names></name> <name><surname>Zhu</surname> <given-names>M. Z.</given-names></name> <name><surname>Lin</surname> <given-names>H. X.</given-names></name></person-group> (<year>2007</year>). <article-title>A QTL for rice grain width and weight encodes a previously unknown RING-type E3 ubiquitin ligase.</article-title> <source><italic>Nat. Genet.</italic></source> <volume>39</volume> <fpage>623</fpage>&#x2013;<lpage>630</lpage>. <pub-id pub-id-type="doi">10.1038/ng2014</pub-id> <pub-id pub-id-type="pmid">17417637</pub-id></citation></ref>
<ref id="B77"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Spannagl</surname> <given-names>M.</given-names></name> <name><surname>Nussbaumer</surname> <given-names>T.</given-names></name> <name><surname>Bader</surname> <given-names>K. C.</given-names></name> <name><surname>Martis</surname> <given-names>M. M.</given-names></name> <name><surname>Seidel</surname> <given-names>M.</given-names></name> <name><surname>Kugler</surname> <given-names>K. G.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>PGSB PlantsDB: updates to the database framework for comparative plant genome research.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>44</volume> <fpage>D1141</fpage>&#x2013;<lpage>D1147</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkv1130</pub-id> <pub-id pub-id-type="pmid">26527721</pub-id></citation></ref>
<ref id="B78"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Stam</surname> <given-names>P.</given-names></name></person-group> (<year>1993</year>). <article-title>Construction of integrated genetic linkage maps by means of a new computer package: join map.</article-title> <source><italic>Plant J.</italic></source> <volume>3</volume> <fpage>739</fpage>&#x2013;<lpage>744</lpage>. <pub-id pub-id-type="doi">10.1111/j.1365-313X.1993.00739.x</pub-id></citation></ref>
<ref id="B79"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Stamatakis</surname> <given-names>A.</given-names></name></person-group> (<year>2014</year>). <article-title>RAxML version 8: a tool for phylogenetic analysis and post-analysis of large phylogenies.</article-title> <source><italic>Bioinformatics</italic></source> <volume>30</volume> <fpage>1312</fpage>&#x2013;<lpage>1313</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btu033</pub-id> <pub-id pub-id-type="pmid">24451623</pub-id></citation></ref>
<ref id="B80"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Stanke</surname> <given-names>M.</given-names></name> <name><surname>Diekhans</surname> <given-names>M.</given-names></name> <name><surname>Baertsch</surname> <given-names>R.</given-names></name> <name><surname>Haussler</surname> <given-names>D.</given-names></name></person-group> (<year>2008</year>). <article-title>Using native and syntenically mapped cDNA alignments to improve de novo gene finding.</article-title> <source><italic>Bioinformatics</italic></source> <volume>24</volume> <fpage>637</fpage>&#x2013;<lpage>644</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btn013</pub-id> <pub-id pub-id-type="pmid">18218656</pub-id></citation></ref>
<ref id="B81"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Stanke</surname> <given-names>M.</given-names></name> <name><surname>Waack</surname> <given-names>S.</given-names></name></person-group> (<year>2003</year>). <article-title>Gene prediction with a hidden Markov model and a new intron submodel.</article-title> <source><italic>Bioinformatics</italic></source> <volume>19</volume> <fpage>215</fpage>&#x2013;<lpage>225</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btg1080</pub-id> <pub-id pub-id-type="pmid">14534192</pub-id></citation></ref>
<ref id="B82"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Stein</surname> <given-names>J. C.</given-names></name> <name><surname>Yu</surname> <given-names>Y.</given-names></name> <name><surname>Copetti</surname> <given-names>D.</given-names></name> <name><surname>Zwickl</surname> <given-names>D. J.</given-names></name> <name><surname>Zhang</surname> <given-names>L.</given-names></name> <name><surname>Zhang</surname> <given-names>C.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>Genomes of 13 domesticated and wild rice relatives highlight genetic conservation, turnover and innovation across the genus <italic>Oryza</italic>.</article-title> <source><italic>Nat. Genet.</italic></source> <volume>7</volume> <fpage>285</fpage>&#x2013;<lpage>296</lpage>. <pub-id pub-id-type="doi">10.1038/s41588-018-0040-0</pub-id> <pub-id pub-id-type="pmid">29358651</pub-id></citation></ref>
<ref id="B83"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sun</surname> <given-names>C.</given-names></name> <name><surname>Wang</surname> <given-names>X.</given-names></name> <name><surname>Yoshimura</surname> <given-names>A.</given-names></name> <name><surname>Doi</surname> <given-names>K.</given-names></name></person-group> (<year>2002</year>). <article-title>Genetic differentiation for nuclear, mitochondrial and chloroplast genomes in common wild rice (<italic>Oryza rufipogon</italic> Griff.) and cultivated rice (<italic>Oryza sativa</italic> L.).</article-title> <source><italic>Theor. Appl. Genet.</italic></source> <volume>104</volume> <fpage>1335</fpage>&#x2013;<lpage>1345</lpage>. <pub-id pub-id-type="doi">10.1007/s00122-002-0878-4</pub-id> <pub-id pub-id-type="pmid">12582589</pub-id></citation></ref>
<ref id="B84"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sun</surname> <given-names>J.</given-names></name> <name><surname>Ma</surname> <given-names>D.</given-names></name> <name><surname>Tang</surname> <given-names>L.</given-names></name> <name><surname>Zhao</surname> <given-names>M.</given-names></name> <name><surname>Zhang</surname> <given-names>G.</given-names></name> <name><surname>Wang</surname> <given-names>W.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>Population genomic analysis and de novo assembly reveal the origin of weedy rice as an evolutionary game.</article-title> <source><italic>Mol. Plant</italic></source> <volume>12</volume> <fpage>632</fpage>&#x2013;<lpage>647</lpage>. <pub-id pub-id-type="doi">10.1016/j.molp.2019.01.019</pub-id> <pub-id pub-id-type="pmid">30710646</pub-id></citation></ref>
<ref id="B85"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sun</surname> <given-names>J.</given-names></name> <name><surname>Qian</surname> <given-names>Q.</given-names></name> <name><surname>Ma</surname> <given-names>D. R.</given-names></name> <name><surname>Xu</surname> <given-names>Z. J.</given-names></name> <name><surname>Liu</surname> <given-names>D.</given-names></name> <name><surname>Du</surname> <given-names>H. B.</given-names></name><etal/></person-group> (<year>2013</year>). <article-title>Introgression and selection shaping the genome and adaptive loci of weedy rice in northern China.</article-title> <source><italic>New Phytol.</italic></source> <volume>197</volume> <fpage>290</fpage>&#x2013;<lpage>299</lpage>. <pub-id pub-id-type="doi">10.1111/nph.12012</pub-id> <pub-id pub-id-type="pmid">23106357</pub-id></citation></ref>
<ref id="B86"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sun</surname> <given-names>X.</given-names></name> <name><surname>Jia</surname> <given-names>Q.</given-names></name> <name><surname>Guo</surname> <given-names>Y.</given-names></name> <name><surname>Zheng</surname> <given-names>X.</given-names></name> <name><surname>Liang</surname> <given-names>K.</given-names></name></person-group> (<year>2015</year>). <article-title>Whole-genome analysis revealed the positively selected genes during the differentiation of indica and temperate japonica rice.</article-title> <source><italic>PLoS One</italic></source> <volume>10</volume>:<fpage>e0119239</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0119239</pub-id> <pub-id pub-id-type="pmid">25774680</pub-id></citation></ref>
<ref id="B87"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Vaughan</surname> <given-names>D. A.</given-names></name> <name><surname>Bal&#x00E1;zs</surname> <given-names>E.</given-names></name> <name><surname>Heslop-Harrison</surname> <given-names>J. S.</given-names></name></person-group> (<year>2007</year>). <article-title>From crop domestication to super-domestication.</article-title> <source><italic>Ann. Bot.</italic></source> <volume>100</volume> <fpage>893</fpage>&#x2013;<lpage>901</lpage>. <pub-id pub-id-type="doi">10.1093/aob/mcm224</pub-id> <pub-id pub-id-type="pmid">17940074</pub-id></citation></ref>
<ref id="B88"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Walker</surname> <given-names>B. J.</given-names></name> <name><surname>Abeel</surname> <given-names>T.</given-names></name> <name><surname>Shea</surname> <given-names>T.</given-names></name> <name><surname>Priest</surname> <given-names>M.</given-names></name> <name><surname>Abouelliel</surname> <given-names>A.</given-names></name> <name><surname>Sakthikumar</surname> <given-names>S.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>Pilon: an integrated tool for comprehensive microbial variant detection and genome assembly improvement.</article-title> <source><italic>PLoS One</italic></source> <volume>9</volume>:<fpage>e112963</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0112963</pub-id> <pub-id pub-id-type="pmid">25409509</pub-id></citation></ref>
<ref id="B89"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>C.</given-names></name> <name><surname>Yu</surname> <given-names>H.</given-names></name> <name><surname>Huang</surname> <given-names>J.</given-names></name> <name><surname>Wang</surname> <given-names>W.</given-names></name> <name><surname>Faruquee</surname> <given-names>M.</given-names></name> <name><surname>Zhang</surname> <given-names>F.</given-names></name><etal/></person-group> (<year>2020</year>). <article-title>Towards a deeper haplotype mining of complex traits in rice with RFGB v2.0.</article-title> <source><italic>Plant Biotechnol J.</italic></source> <volume>18</volume> <fpage>14</fpage>&#x2013;<lpage>16</lpage>. <pub-id pub-id-type="doi">10.1111/pbi.13215</pub-id> <pub-id pub-id-type="pmid">31336017</pub-id></citation></ref>
<ref id="B90"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>F.</given-names></name> <name><surname>Zhang</surname> <given-names>J.</given-names></name> <name><surname>Chen</surname> <given-names>Y.</given-names></name> <name><surname>Zhang</surname> <given-names>C.</given-names></name> <name><surname>Gong</surname> <given-names>J.</given-names></name> <name><surname>Song</surname> <given-names>Z.</given-names></name><etal/></person-group> (<year>2020</year>). <article-title>Identification of candidate genes for key fibre-related QTLs and derivation of favourable alleles in <italic>Gossypium hirsutum</italic> recombinant inbred lines with <italic>G.barbadense</italic> introgressions.</article-title> <source><italic>Plant Biotechnol. J.</italic></source> <volume>18</volume> <fpage>707</fpage>&#x2013;<lpage>720</lpage>. <pub-id pub-id-type="doi">10.1111/pbi.13237</pub-id> <pub-id pub-id-type="pmid">31446669</pub-id></citation></ref>
<ref id="B91"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>S.</given-names></name> <name><surname>Wu</surname> <given-names>K.</given-names></name> <name><surname>Yuan</surname> <given-names>Q.</given-names></name> <name><surname>Liu</surname> <given-names>X.</given-names></name> <name><surname>Liu</surname> <given-names>Z.</given-names></name> <name><surname>Lin</surname> <given-names>X.</given-names></name><etal/></person-group> (<year>2012b</year>). <article-title>Control of grain size, shape and quality by OsSPL16 in rice.</article-title> <source><italic>Nat. Genet.</italic></source> <volume>44</volume> <fpage>950</fpage>&#x2013;<lpage>954</lpage>. <pub-id pub-id-type="doi">10.1038/ng.2327</pub-id> <pub-id pub-id-type="pmid">22729225</pub-id></citation></ref>
<ref id="B92"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>S.</given-names></name> <name><surname>Basten</surname> <given-names>C. J.</given-names></name> <name><surname>Zeng</surname> <given-names>Z.</given-names></name></person-group> (<year>2012a</year>). <source><italic>Windows QTL Cartographer v2.5. Department of Statistics.</italic></source> <publisher-loc>Raleigh, NC</publisher-loc>: <publisher-name>North Carolina State University</publisher-name>.</citation></ref>
<ref id="B93"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>Y.</given-names></name> <name><surname>Tang</surname> <given-names>H.</given-names></name> <name><surname>Debarry</surname> <given-names>J. D.</given-names></name> <name><surname>Tan</surname> <given-names>X.</given-names></name> <name><surname>Li</surname> <given-names>J.</given-names></name> <name><surname>Wang</surname> <given-names>X.</given-names></name><etal/></person-group> (<year>2012c</year>). <article-title>MCScanX: a toolkit for detection and evolutionary analysis of gene synteny and collinearity.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>40</volume>:<fpage>e49</fpage>. <pub-id pub-id-type="doi">10.1093/nar/gkr1293</pub-id> <pub-id pub-id-type="pmid">22217600</pub-id></citation></ref>
<ref id="B94"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>W.</given-names></name> <name><surname>Mauleon</surname> <given-names>R.</given-names></name> <name><surname>Hu</surname> <given-names>Z.</given-names></name> <name><surname>Chebotarov</surname> <given-names>D.</given-names></name> <name><surname>Tai</surname> <given-names>S.</given-names></name> <name><surname>Wu</surname> <given-names>Z.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>Genomic variation in 3,010 diverse accessions of Asian cultivated rice.</article-title> <source><italic>Nature</italic></source> <volume>557</volume> <fpage>43</fpage>&#x2013;<lpage>49</lpage>. <pub-id pub-id-type="doi">10.1038/s41586-018-0063-9</pub-id> <pub-id pub-id-type="pmid">29695866</pub-id></citation></ref>
<ref id="B95"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wei</surname> <given-names>C.</given-names></name> <name><surname>Gao</surname> <given-names>Y.</given-names></name> <name><surname>Xie</surname> <given-names>W.</given-names></name> <name><surname>Liang</surname> <given-names>G.</given-names></name> <name><surname>Kai</surname> <given-names>L.</given-names></name> <name><surname>Wang</surname> <given-names>W.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>Genome-wide association analyses provide genetic and biochemical insights into natural variation in rice metabolism.</article-title> <source><italic>Nat. Genet.</italic></source> <volume>46</volume> <fpage>714</fpage>&#x2013;<lpage>721</lpage>. <pub-id pub-id-type="doi">10.1038/ng.3007</pub-id> <pub-id pub-id-type="pmid">24908251</pub-id></citation></ref>
<ref id="B96"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wet</surname> <given-names>J. M. J. D.</given-names></name> <name><surname>Harlan</surname> <given-names>J. R.</given-names></name></person-group> (<year>1975</year>). <article-title>Weeds and domesticates: evolution in the man-made habitat.</article-title> <source><italic>Econ. Bot.</italic></source> <volume>29</volume> <fpage>99</fpage>&#x2013;<lpage>107</lpage>. <pub-id pub-id-type="doi">10.1007/BF02863309</pub-id></citation></ref>
<ref id="B97"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Xiao</surname> <given-names>M.</given-names></name> <name><surname>Phong</surname> <given-names>A.</given-names></name> <name><surname>Ha</surname> <given-names>C.</given-names></name> <name><surname>Chan</surname> <given-names>T. F.</given-names></name> <name><surname>Cai</surname> <given-names>D.</given-names></name> <name><surname>Leung</surname> <given-names>L.</given-names></name><etal/></person-group> (<year>2007</year>). <article-title>Rapid DNA mapping by fluorescent single molecule detection.</article-title> <source><italic>Nuclc Acids Res.</italic></source> <volume>35</volume>:<fpage>e16</fpage>. <pub-id pub-id-type="doi">10.1093/nar/gkl1044</pub-id> <pub-id pub-id-type="pmid">17175538</pub-id></citation></ref>
<ref id="B98"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Xu</surname> <given-names>J.</given-names></name> <name><surname>Xing</surname> <given-names>Y.</given-names></name> <name><surname>Xu</surname> <given-names>Y.</given-names></name> <name><surname>Wan</surname> <given-names>J.</given-names></name></person-group> (<year>2021</year>). <article-title>Breeding by design for future rice: genes and genome technologies.</article-title> <source><italic>Crop J.</italic></source> <volume>9</volume> <fpage>491</fpage>&#x2013;<lpage>496</lpage>. <pub-id pub-id-type="doi">10.1016/j.cj.2021.03.006</pub-id></citation></ref>
<ref id="B99"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Xun</surname> <given-names>X.</given-names></name> <name><surname>Xin</surname> <given-names>L.</given-names></name> <name><surname>Song</surname> <given-names>G.</given-names></name> <name><surname>Jensen</surname> <given-names>J. D.</given-names></name> <name><surname>Hu</surname> <given-names>F.</given-names></name> <name><surname>Li</surname> <given-names>X.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>Resequencing 50 accessions of cultivated and wild rice yields markers for identifying agronomically important genes.</article-title> <source><italic>Nat. Biotechnol.</italic></source> <volume>30</volume> <fpage>105</fpage>&#x2013;<lpage>111</lpage>. <pub-id pub-id-type="doi">10.1038/nbt.2050</pub-id> <pub-id pub-id-type="pmid">22158310</pub-id></citation></ref>
<ref id="B100"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname> <given-names>J.</given-names></name> <name><surname>Zhang</surname> <given-names>C.</given-names></name> <name><surname>Zhao</surname> <given-names>N.</given-names></name> <name><surname>Zhang</surname> <given-names>L.</given-names></name> <name><surname>Hu</surname> <given-names>Z.</given-names></name> <name><surname>Chen</surname> <given-names>S.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>Chinese root-type mustard provides phylogenomic insights into the evolution of the multi-use diversified allopolyploid <italic>Brassica juncea</italic>.</article-title> <source><italic>Mol. Plant</italic></source> <volume>11</volume> <fpage>512</fpage>&#x2013;<lpage>514</lpage>. <pub-id pub-id-type="doi">10.1055/s-0043-120348</pub-id> <pub-id pub-id-type="pmid">29113005</pub-id></citation></ref>
<ref id="B101"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname> <given-names>W.</given-names></name> <name><surname>Wu</surname> <given-names>K.</given-names></name> <name><surname>Wang</surname> <given-names>B.</given-names></name> <name><surname>Liu</surname> <given-names>H.</given-names></name> <name><surname>Guo</surname> <given-names>S.</given-names></name> <name><surname>Guo</surname> <given-names>X.</given-names></name><etal/></person-group> (<year>2021</year>). <article-title>The RING E3 ligase CLG1 targets GS3 for degradation via the endosome pathway to determine grain size in rice.</article-title> <source><italic>Mol. Plant</italic></source> <volume>14</volume> <fpage>1699</fpage>&#x2013;<lpage>1713</lpage>. <pub-id pub-id-type="doi">10.1016/j.molp.2021.06.027</pub-id> <pub-id pub-id-type="pmid">34216830</pub-id></citation></ref>
<ref id="B102"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname> <given-names>X.</given-names></name> <name><surname>Hwa</surname> <given-names>C.</given-names></name></person-group> (<year>2008</year>). <article-title>Genetic modification of plant architecture and variety improvement in rice.</article-title> <source><italic>Heredity</italic></source> <volume>101</volume> <fpage>396</fpage>&#x2013;<lpage>404</lpage>. <pub-id pub-id-type="doi">10.1038/hdy.2008.90</pub-id> <pub-id pub-id-type="pmid">18716608</pub-id></citation></ref>
<ref id="B103"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname> <given-names>Z.</given-names></name></person-group> (<year>2007</year>). <article-title>PAML 4: phylogenetic analysis by maximum likelihood.</article-title> <source><italic>Mol. Biol. Evol.</italic></source> <volume>24</volume> <fpage>1586</fpage>&#x2013;<lpage>1591</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msm088</pub-id> <pub-id pub-id-type="pmid">17483113</pub-id></citation></ref>
<ref id="B104"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yano</surname> <given-names>K.</given-names></name> <name><surname>Yamamoto</surname> <given-names>E.</given-names></name> <name><surname>Aya</surname> <given-names>K.</given-names></name> <name><surname>Takeuchi</surname> <given-names>H.</given-names></name> <name><surname>Lo</surname> <given-names>P. C.</given-names></name> <name><surname>Hu</surname> <given-names>L.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>Genome-wide association study using whole-genome sequencing rapidly identifies new genes influencing agronomic traits in rice.</article-title> <source><italic>Nat. Genet.</italic></source> <volume>48</volume> <fpage>927</fpage>&#x2013;<lpage>934</lpage>. <pub-id pub-id-type="doi">10.1038/ng.3596</pub-id> <pub-id pub-id-type="pmid">27322545</pub-id></citation></ref>
<ref id="B105"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yu</surname> <given-names>J.</given-names></name> <name><surname>Hu</surname> <given-names>S.</given-names></name> <name><surname>Wang</surname> <given-names>J.</given-names></name> <name><surname>Li</surname> <given-names>S.</given-names></name> <name><surname>Wong</surname> <given-names>K. S. G.</given-names></name> <name><surname>Liu</surname> <given-names>B.</given-names></name><etal/></person-group> (<year>2002</year>). <article-title>A draft sequence of the rice genome (<italic>Oryza sativa</italic> L. ssp. indica).</article-title> <source><italic>Science</italic></source> <volume>296</volume> <fpage>79</fpage>&#x2013;<lpage>92</lpage>. <pub-id pub-id-type="doi">10.1126/science.1068037</pub-id> <pub-id pub-id-type="pmid">11935017</pub-id></citation></ref>
<ref id="B106"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zdobnov</surname> <given-names>E. M.</given-names></name> <name><surname>Apweiler</surname> <given-names>R.</given-names></name></person-group> (<year>2001</year>). <article-title>InterProScan&#x2013;an integration platform for the signature-recognition methods in InterPro.</article-title> <source><italic>Bioinformatics</italic></source> <volume>17</volume> <fpage>847</fpage>&#x2013;<lpage>848</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/17.9.847</pub-id> <pub-id pub-id-type="pmid">11590104</pub-id></citation></ref>
<ref id="B107"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zeng</surname> <given-names>L.</given-names></name> <name><surname>Tu</surname> <given-names>X.-L.</given-names></name> <name><surname>Dai</surname> <given-names>H.</given-names></name> <name><surname>Han</surname> <given-names>F.</given-names></name> <name><surname>Lu</surname> <given-names>B.</given-names></name> <name><surname>Wang</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>Whole genomes and transcriptomes reveal adaptation and domestication of pistachio.</article-title> <source><italic>Genome Biol.</italic></source> <volume>20</volume>:<fpage>79</fpage>. <pub-id pub-id-type="doi">10.1186/s13059-019-1686-3</pub-id> <pub-id pub-id-type="pmid">30999938</pub-id></citation></ref>
<ref id="B108"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>J.</given-names></name> <name><surname>Chen</surname> <given-names>L.</given-names></name> <name><surname>Xing</surname> <given-names>F.</given-names></name> <name><surname>Kudrna</surname> <given-names>D. A.</given-names></name> <name><surname>Yao</surname> <given-names>W.</given-names></name> <name><surname>Copetti</surname> <given-names>D.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>Extensive sequence divergence between the reference genomes of two elite indica rice varieties Zhenshan 97 and Minghui 63.</article-title> <source><italic>Proc. Natl. Acad. U S A.</italic></source> <volume>113</volume> <fpage>E5163</fpage>&#x2013;<lpage>E5171</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1611012113</pub-id> <pub-id pub-id-type="pmid">27535938</pub-id></citation></ref>
<ref id="B109"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>Q.</given-names></name> <name><surname>Liang</surname> <given-names>Z.</given-names></name> <name><surname>Cui</surname> <given-names>X.</given-names></name> <name><surname>Ji</surname> <given-names>C.</given-names></name> <name><surname>Li</surname> <given-names>Y.</given-names></name> <name><surname>Zhang</surname> <given-names>P.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>N6-Methyladenine DNA methylation in Japonica and indica rice genomes and its association with gene expression, plant development, and stress responses.</article-title> <source><italic>Mol. Plant</italic></source> <volume>11</volume> <fpage>1492</fpage>&#x2013;<lpage>1508</lpage>. <pub-id pub-id-type="doi">10.1016/j.molp.2018.11.005</pub-id> <pub-id pub-id-type="pmid">30448535</pub-id></citation></ref>
<ref id="B110"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>Q.</given-names></name> <name><surname>Zhu</surname> <given-names>T.</given-names></name> <name><surname>Xia</surname> <given-names>E.</given-names></name> <name><surname>Shi</surname> <given-names>C.</given-names></name> <name><surname>Liu</surname> <given-names>Y.</given-names></name> <name><surname>Zhang</surname> <given-names>Y.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>Rapid diversification of five Oryza AA genomes associated with rice adaptation.</article-title> <source><italic>Proc. Natl. Acad. Sci. U S A.</italic></source> <volume>111</volume> <fpage>4954</fpage>&#x2013;<lpage>4962</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1418307111</pub-id> <pub-id pub-id-type="pmid">25368197</pub-id></citation></ref>
<ref id="B111"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhu</surname> <given-names>Q.</given-names></name> <name><surname>Ge</surname> <given-names>S.</given-names></name></person-group> (<year>2005</year>). <article-title>Phylogenetic relationships among a-genome species of the genus Oryza revealed by intron sequences of four nuclear genes.</article-title> <source><italic>New Phytol.</italic></source> <volume>167</volume> <fpage>249</fpage>&#x2013;<lpage>265</lpage>. <pub-id pub-id-type="doi">10.1111/j.1469-8137.2005.01406.x</pub-id> <pub-id pub-id-type="pmid">15948847</pub-id></citation></ref>
</ref-list>
<fn-group>
<fn id="footnote1">
<label>1</label>
<p><ext-link ext-link-type="uri" xlink:href="http://plants.ensembl.org">http://plants.ensembl.org</ext-link></p></fn>
</fn-group>
</back>
</article>