<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Genet.</journal-id>
<journal-title>Frontiers in Genetics</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Genet.</abbrev-journal-title>
<issn pub-type="epub">1664-8021</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fgene.2020.580568</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Genetics</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Improved <italic>de novo</italic> Assembly of the Achlorophyllous Orchid <italic>Gastrodia elata</italic></article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Chen</surname> <given-names>Shanshan</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="author-notes" rid="fn002"><sup>&#x2020;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/696229/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Wang</surname> <given-names>Xiao</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<xref ref-type="author-notes" rid="fn002"><sup>&#x2020;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1125117/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Wang</surname> <given-names>Yangzi</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<xref ref-type="author-notes" rid="fn002"><sup>&#x2020;</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Zhang</surname> <given-names>Guanghui</given-names></name>
<xref ref-type="aff" rid="aff6"><sup>6</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/347812/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Song</surname> <given-names>Wanling</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Dong</surname> <given-names>Xiao</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/911435/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Arnold</surname> <given-names>Michael L.</given-names></name>
<xref ref-type="aff" rid="aff7"><sup>7</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/228226/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Wang</surname> <given-names>Wen</given-names></name>
<xref ref-type="aff" rid="aff8"><sup>8</sup></xref>
<xref ref-type="aff" rid="aff9"><sup>9</sup></xref>
<xref ref-type="aff" rid="aff10"><sup>10</sup></xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Miao</surname> <given-names>Jianhua</given-names></name>
<xref ref-type="aff" rid="aff11"><sup>11</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Chen</surname> <given-names>Wei</given-names></name>
<xref ref-type="aff" rid="aff12"><sup>12</sup></xref>
<xref ref-type="aff" rid="aff13"><sup>13</sup></xref>
<xref ref-type="aff" rid="aff14"><sup>14</sup></xref>
<xref ref-type="corresp" rid="c002"><sup>&#x002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1023205/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Dong</surname> <given-names>Yang</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<xref ref-type="aff" rid="aff11"><sup>11</sup></xref>
<xref ref-type="aff" rid="aff12"><sup>12</sup></xref>
<xref ref-type="aff" rid="aff14"><sup>14</sup></xref>
<xref ref-type="corresp" rid="c003"><sup>&#x002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/694956/overview"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>School of Life Sciences, Zhengzhou University</institution>, <addr-line>Zhengzhou</addr-line>, <country>China</country></aff>
<aff id="aff2"><sup>2</sup><institution>BGI College, Zhengzhou University</institution>, <addr-line>Zhengzhou</addr-line>, <country>China</country></aff>
<aff id="aff3"><sup>3</sup><institution>State Key Laboratory of Genetic Resources and Evolution, Kunming Institute of Zoology, Chinese Academy of Sciences</institution>, <addr-line>Kunming</addr-line>, <country>China</country></aff>
<aff id="aff4"><sup>4</sup><institution>Jiaxing Synbiolab Biotechnology Co., Ltd.</institution>, <addr-line>Jiaxing</addr-line>, <country>China</country></aff>
<aff id="aff5"><sup>5</sup><institution>College of Biological Big Data, Yunnan Agricultural University</institution>, <addr-line>Kunming</addr-line>, <country>China</country></aff>
<aff id="aff6"><sup>6</sup><institution>The Key Laboratory of Medicinal Plant Biology of Yunnan Province, National and Local Joint Engineering Research Center on Germplasm Innovation and Utilization of Chinese Medicinal Materials in Southwest China, Yunnan Agricultural University</institution>, <addr-line>Kunming</addr-line>, <country>China</country></aff>
<aff id="aff7"><sup>7</sup><institution>Department of Genetics, University of Georgia</institution>, <addr-line>Athens, GA</addr-line>, <country>United States</country></aff>
<aff id="aff8"><sup>8</sup><institution>State Key Laboratory of Genetic Resources and Evolution, Kunming Institute of Zoology, Chinese Academy of Sciences</institution>, <addr-line>Kunming</addr-line>, <country>China</country></aff>
<aff id="aff9"><sup>9</sup><institution>Center for Ecological and Environmental Sciences, Northwestern Polytechnical University</institution>, <addr-line>Xi&#x2019;an</addr-line>, <country>China</country></aff>
<aff id="aff10"><sup>10</sup><institution>Center for Excellence in Animal Evolution and Genetics, Chinese Academy of Sciences</institution>, <addr-line>Kunming</addr-line>, <country>China</country></aff>
<aff id="aff11"><sup>11</sup><institution>Guangxi Key Laboratory of Medicinal Resources Protection and Genetic Improvement, Guangxi Botanical Garden of Medicinal Plants</institution>, <addr-line>Nanning</addr-line>, <country>China</country></aff>
<aff id="aff12"><sup>12</sup><institution>State Key Laboratory of Conservation and Utilization of Bio-Resources in Yunnan, Yunnan Agricultural University</institution>, <addr-line>Kunming</addr-line>, <country>China</country></aff>
<aff id="aff13"><sup>13</sup><institution>College of Agronomy and Biotechnology, Yunnan Agricultural University</institution>, <addr-line>Kunming</addr-line>, <country>China</country></aff>
<aff id="aff14"><sup>14</sup><institution>Yunnan Research Institute for Local Plateau Agriculture and Industry</institution>, <addr-line>Kunming</addr-line>, <country>China</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Wei Chen, North China University of Science and Technology, China</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Liangsheng Zhang, Zhejiang University, China; Xiaohua Jin, Institute of Botany (CAS), China</p></fn>
<corresp id="c001">&#x002A;Correspondence: Jianhua Miao, <email>mjh1962@vip.163.com</email></corresp>
<corresp id="c002">Wei Chen, <email>wchenntr@gmail.com</email></corresp>
<corresp id="c003">Yang Dong, <email>loyalyang@163.com</email></corresp>
<fn fn-type="other" id="fn002"><p><sup>&#x2020;</sup>These authors have contributed equally to this work</p></fn>
<fn fn-type="other" id="fn004"><p>This article was submitted to Plant Genomics, a section of the journal Frontiers in Genetics</p></fn>
</author-notes>
<pub-date pub-type="epub">
<day>19</day>
<month>11</month>
<year>2020</year>
</pub-date>
<pub-date pub-type="collection">
<year>2020</year>
</pub-date>
<volume>11</volume>
<elocation-id>580568</elocation-id>
<history>
<date date-type="received">
<day>06</day>
<month>07</month>
<year>2020</year>
</date>
<date date-type="accepted">
<day>19</day>
<month>10</month>
<year>2020</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2020 Chen, Wang, Wang, Zhang, Song, Dong, Arnold, Wang, Miao, Chen and Dong.</copyright-statement>
<copyright-year>2020</copyright-year>
<copyright-holder>Chen, Wang, Wang, Zhang, Song, Dong, Arnold, Wang, Miao, Chen and Dong</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<p>Achlorophyllous plants are full mycoheterotrophic plants with no chlorophyll and they obtain their nutrients from soil fungi. <italic>Gastrodia elata</italic> is a perennial, achlorophyllous orchid that displays distinctive evolutionary strategy of adaptation to the non-photosynthetic lifestyle. Here in this study, the genome of <italic>G. elata</italic> was assembled to 1.12 Gb with a contig N50 size of 110 kb and a scaffold N50 size of 1.64 Mb so that it helped unveil the genetic basics of those adaptive changes. Based on the genomic data, key genes related to photosynthesis, leaf development, and plastid division pathways were found to be lost or under relaxed selection during the course of evolution. Thus, the genome sequence of <italic>G. elata</italic> provides a good resource for future investigations of the evolution of orchids and other achlorophyllous plants.</p>
</abstract>
<kwd-group>
<kwd><italic>Gastrodia elata</italic></kwd>
<kwd>genome</kwd>
<kwd>achlorophyllous</kwd>
<kwd>relaxed selection</kwd>
<kwd>non-photosynthetic</kwd>
</kwd-group>
<counts>
<fig-count count="3"/>
<table-count count="1"/>
<equation-count count="0"/>
<ref-count count="46"/>
<page-count count="10"/>
<word-count count="0"/>
</counts>
</article-meta>
</front>
<body>
<sec id="S1">
<title>Introduction</title>
<p>In the autotroph-dominant plant world, the symbiotic relationship between plants and fungi plays an indispensable role in the maintenance of ecosystem (<xref ref-type="bibr" rid="B31">Read, 1991</xref>). In an extreme situation, some plants (at least 50 independent origins) have become solely dependent upon their fungal associates for energy source and other nutrients during the course of evolution (<xref ref-type="bibr" rid="B28">Merckx and Freudenstein, 2010</xref>). These fully mycoheterotrophic plants often lack a functional photosynthetic mechanism, so they are termed as &#x201C;non-photosynthetic plants (<xref ref-type="bibr" rid="B27">Merckx et al., 2009</xref>).&#x201D;</p>
<p>The loss of photosynthesis was independently evolved over 40 times in a diverse range of plant families and genera (<xref ref-type="bibr" rid="B2">Bidartondo, 2005</xref>). As an evolutionary adaptation to a low-light undergrowth environment, this extreme phenotype was also associated with some quite remarkable parallel evolutionary traits in plant, such as smaller biomass, specialized leaves without stomata, lack of root hair, reduced vascular tissues, and miniatured seeds (<xref ref-type="bibr" rid="B21">Leake, 1994</xref>). Even though multiple studies of plastomes from heterotrophic plants have showed reduction in plastome sizes and housekeeping gene numbers (<xref ref-type="bibr" rid="B16">Krause, 2008</xref>; <xref ref-type="bibr" rid="B1">Barrett and Davis, 2012</xref>; <xref ref-type="bibr" rid="B38">Wicke et al., 2013</xref>, <xref ref-type="bibr" rid="B39">2014</xref>), the nuclear genomic basis of the other parallel traits in non-photosynthetic plants remains elusive.</p>
<p>All members of the Orchidaceae family (up to 26,567 species in 880 genera) rely on fungal associates in some or all stages of their life cycle (<xref ref-type="bibr" rid="B21">Leake, 1994</xref>; <xref ref-type="bibr" rid="B3">Cai et al., 2015</xref>). In particular, more than 200 orchid species from a myriad genera are fully mycoheterotrophic and non-photosynthetic (<xref ref-type="bibr" rid="B21">Leake, 1994</xref>; <xref ref-type="bibr" rid="B27">Merckx et al., 2009</xref>; <xref ref-type="bibr" rid="B28">Merckx and Freudenstein, 2010</xref>). Since <italic>Gastrodia</italic> is one of the largest genera consisting of fully mycoheterotrophic species from a wide geographic area (<xref ref-type="bibr" rid="B4">Cribb and Killmann, 2010</xref>), members in this genus are excellent models to investigate the reconfigured traits in non-photosynthetic plants.</p>
<p>In China, <italic>Gastrodia elata</italic> is cultivated for medicinal uses. It is a perennial, non-photosynthetic orchid with an enlarged rhizome and vestigial leaves on an upright flower-bearing stem (<xref ref-type="fig" rid="F1">Figure 1A</xref>). The completion of its life cycle requires at least two types of fungi: <italic>Armillaria</italic> and <italic>Mycena</italic> (<xref ref-type="bibr" rid="B19">Lan et al., 1994</xref>; <xref ref-type="bibr" rid="B29">Ning et al., 2010</xref>) (<xref ref-type="supplementary-material" rid="FS1">Supplementary Figure 1</xref>). In this study, we presented a high quality <italic>de novo</italic> assembly of the <italic>G. elata</italic> nuclear genome, which had a higher coverage, contig N50 size, and Benchmarking Universal Single-Copy Ortholog (BUSCO) completeness than that of a previous report (<xref ref-type="bibr" rid="B44">Yuan et al., 2018</xref>). Compared with the genomes of photosynthetic orchid species, such as <italic>Phalaenopsis equestris</italic> (<xref ref-type="bibr" rid="B3">Cai et al., 2015</xref>), <italic>Apostasia Shenzhenica</italic> (<xref ref-type="bibr" rid="B45">Zhang et al., 2017</xref>), and <italic>Dendrobium officinale</italic> (<xref ref-type="bibr" rid="B41">Yan et al., 2015</xref>), the new <italic>G. elata</italic> nuclear genome and plastome assemblies showed key gene loss and relaxed selection related to its non-functional photosystem and retarded leaf development. These data demonstrated that the improved <italic>G. elata</italic> genome provides more insights into the genomic and evolutionary mechanisms underlying the morphological and physiological adaptations associated with a non-photosynthetic lifestyle.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption><p>Divergence time and morphology of <italic>G. elata</italic>. <bold>(A)</bold> Morphology of <italic>G. elata</italic>: photos showing a whole plant, flower, stem with degraded blade and tuber. <bold>(B)</bold> Divergence times are indicated by pink bars, expanded gene family numbers by dark blue letters and contracted gene families by orange letters.</p></caption>
<graphic xlink:href="fgene-11-580568-g001.tif"/>
</fig>
</sec>
<sec id="S2" sec-type="materials|methods">
<title>Materials and Methods</title>
<sec id="S2.SS1">
<title>Plant Material, Genomic DNA Extraction, and Library Construction</title>
<p>A flowering <italic>G. elata</italic> Bl. f. glauca S. Chow plant was collected from Zhaotong, Yunnan Province, China (103&#x00B0;43&#x2032;E, 27&#x00B0;20&#x2032;N). Genomic DNA was extracted from fresh stems by the Qiagen DNeasy Plant Mini Kit (Cat. No. 69104). After genomic DNA purification and quality validation, 10 paired-end and mate-pair DNA libraries with insert sizes of 169 bp (&#x00D7;2), 300 bp (&#x00D7;2), 374 bp, 545 bp, 753 kb, 2 kb, 5 kb, and 10 kb were constructed using library construction kits (Illumina) as previously described (<xref ref-type="bibr" rid="B23">Liang et al., 2015</xref>; <xref ref-type="supplementary-material" rid="TS1">Supplementary Table 1</xref>).</p>
</sec>
<sec id="S2.SS2">
<title>Genome Sequencing and Assembly</title>
<p>A whole-genome shotgun strategy was adopted to sequence and assemble the genome of <italic>G. elata</italic>. All ten DNA libraries were sequenced on an Illumina HiSeq 2000 platform and 483.07 Gb of data was obtained. The genome size of <italic>G. elata</italic> was estimated according to the 17-mer frequency distribution with the formula: Genome size = <italic>K</italic>-mer_num/Peak_depth. Total of 84.67 Gb data was retained for 17-mer analysis. The 17-mer frequency distribution plot shows the peak at 66 (<xref ref-type="supplementary-material" rid="FS1">Supplementary Figure 2</xref>), and the total <italic>K</italic>-mer count is 90,917,019,718, then the genome size is estimated as 1.378 Gb.</p>
<p>The assembly of <italic>G. elata</italic> genome was carried out using the SOAPdenovo. A <italic>de Bruijn</italic> graph was constructed using the parameter &#x201C;&#x2212;K 83 &#x2212;d 3&#x201D;, then the graph was simplified using &#x201C;&#x2212;M 3&#x201D; parameters to clip tips, remove low coverage links, merge bubbles, and solve tiny repeats. Those repeats on the simplified graph were broken at the boundaries and unambiguous DNA fragments were produced as contigs. Filtered sequencing data was then realigned to contigs with the parameters &#x201C;&#x2212;k 83&#x201D;. Parameter &#x201C;&#x2212;F&#x201D; was used to deal with the paired-end information, and unique contigs were joined to construct scaffolds. Gapcloser (v1.12) was used to fill the gaps between scaffolds with the default parameters.<sup><xref ref-type="fn" rid="footnote1">1</xref></sup> Contigs short than 100 bp were excluded within the whole assembly process.</p>
<p>The completeness and accuracy of the gap closed assembly was assessed using short insert-sized sequencing reads, conserved genes, and RNA-seq data. Filtered reads from three small-insert libraries (169, 374, and 753 bp) were mapped to the assembled genome using the bowtie2 (version 2.2.9<sup><xref ref-type="fn" rid="footnote2">2</xref></sup>) (<xref ref-type="bibr" rid="B20">Langmead and Salzberg, 2012</xref>) with default parameters to estimate the quality of the assembly. The overall mapping rates of these small-insert size reads is higher than 92%, suggesting that most of the <italic>G. elata</italic> genome has been assembled. BUSCOs approach (<xref ref-type="bibr" rid="B37">Waterhouse et al., 2017</xref>) was also used to evaluate the completeness of the <italic>G. elata</italic> genome. Three hundred and three (303) conserved single-copy orthologs has been used as reference, of which 248 (81.85%) were identified in our genome assembly (<xref ref-type="table" rid="T1">Table 1</xref>). Over 74.59 millions of cleaned RNA-seq reads from three different <italic>G. elata</italic> tissues (flower, stem, and tuber) were mapped to the assembled genome with the default settings using the TopHat2 (version 2.0.14<sup><xref ref-type="fn" rid="footnote3">3</xref></sup>) (<xref ref-type="bibr" rid="B35">Trapnell et al., 2009</xref>; <xref ref-type="supplementary-material" rid="TS1">Supplementary Table 2</xref>), and we observed the average mapping ratio of 83%, further validate the high completeness of <italic>G. elata</italic> genome assembly.</p>
<table-wrap position="float" id="T1">
<label>TABLE 1</label>
<caption><p>Various assembly parameters of the <italic>G. elata</italic> genome.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="center"/>
<td valign="top" align="center"><italic>G. elata</italic></td>
</tr>
<tr>
<td/>
<td valign="top" align="center"><italic>G. elata</italic> (This study)</td>
<td valign="top" align="center">(<xref ref-type="bibr" rid="B44">Yuan et al., 2018</xref>)</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Sequencing platform</td>
<td valign="top" align="center">Illumina Hiseq 2000</td>
<td valign="top" align="center">Illumina Hiseq 2500</td>
</tr>
<tr>
<td valign="top" align="left">Sequenced data (Gb)</td>
<td valign="top" align="center">483.07</td>
<td valign="top" align="center">179.1</td>
</tr>
<tr>
<td valign="top" align="left">Genome coverage (&#x00D7;)</td>
<td valign="top" align="center">350.56</td>
<td valign="top" align="center">151.78</td>
</tr>
<tr>
<td valign="top" align="left">Estimated genome size (Gb)</td>
<td valign="top" align="center">1.37</td>
<td valign="top" align="center">1.18</td>
</tr>
<tr>
<td valign="top" align="left">Assembled genome (Gb)</td>
<td valign="top" align="center">1.12</td>
<td valign="top" align="center">1.06</td>
</tr>
<tr>
<td valign="top" align="left">Contig N50 (Kb)</td>
<td valign="top" align="center">110.03</td>
<td valign="top" align="center">68.97</td>
</tr>
<tr>
<td valign="top" align="left">Scaffold N50 (Mb)</td>
<td valign="top" align="center">1.64</td>
<td valign="top" align="center">4.91</td>
</tr>
<tr>
<td valign="top" align="left">TE proportion (%)</td>
<td valign="top" align="center">69.81%</td>
<td valign="top" align="center">66.18%</td>
</tr>
<tr>
<td valign="top" align="left">Total BUSCO groups searched</td>
<td valign="top" align="center">303</td>
<td valign="top" align="center">956</td>
</tr>
<tr>
<td valign="top" align="left">Complete BUSCOs</td>
<td valign="top" align="center">81.85%</td>
<td valign="top" align="center">67.15%</td>
</tr>
<tr>
<td valign="top" align="left">Duplicated BUSCOs</td>
<td valign="top" align="center">17.49%</td>
<td valign="top" align="center">9.21%</td>
</tr>
<tr>
<td valign="top" align="left">Fragmented BUSCOs</td>
<td valign="top" align="center">3.96%</td>
<td valign="top" align="center">4.39%</td>
</tr>
<tr>
<td valign="top" align="left">Missing BUSCOs</td>
<td valign="top" align="center">14.19%</td>
<td valign="top" align="center">28.45%</td>
</tr>
</tbody>
</table></table-wrap>
</sec>
<sec id="S2.SS3">
<title>RNA-Sequencing Data Analysis</title>
<p>Overall, 82.37 million transcriptome raw reads were obtained from <italic>G. elata</italic> leaf, stem, and tuber tissues (<xref ref-type="supplementary-material" rid="TS1">Supplementary Table 2</xref>). First, all RNA-sequencing (RNA-seq) data were filtered by the strict quality control process, then about 74.59 millions cleaned reads were <italic>de novo</italic> assembled using trinity<sup><xref ref-type="fn" rid="footnote4">4</xref></sup> (<xref ref-type="bibr" rid="B9">Grabherr et al., 2011</xref>) with default settings to yield transcripts that prepared for the genome annotation. Next, all RNA-seq reads were mapped to the <italic>G. elata</italic> genome assembly using the TopHat2 (version 2.0.14; see text footnote 3) (<xref ref-type="bibr" rid="B35">Trapnell et al., 2009</xref>) with default settings. The fragments per kilobase of exon model per million reads mapped (FPKM) of each predicted protein-coding gene was calculated by the Cufflinks<sup><xref ref-type="fn" rid="footnote5">5</xref></sup> using default parameters. FPKM &#x003E; = 0.05 was set as the threshold to identify expressed genes.</p>
</sec>
<sec id="S2.SS4">
<title>Repeat Sequence Annotation</title>
<p>RepeatMasker (version 3.2.6) with the Repbase TE library was used to identify known transposable elements (TEs) with the default parameters. The library was constructed by generating the consensus sequence of each TE family, which was used for the RepeatMasker to identify additional high and medium copy repeats in the <italic>G. elata</italic> genome assembly. TRF with parameters set to &#x201C;Match = 2, Mismatch = 7, Delta = 7, PM = 80, PI = 10, Minscore = 50, and MaxPeriod = 2000&#x201D; was used to predict tandem repeats.</p>
</sec>
<sec id="S2.SS5">
<title>Protein-Coding Gene Annotation</title>
<p>A combination of <italic>de novo</italic>-, transcriptome-based prediction, and homology aligning were used to process gene annotation. Gene sets from ten species (<italic>Arabidopsis thaliana</italic>, <italic>Brachypodium distachyon</italic>, <italic>Oryza sativa</italic>, <italic>Sorghum bicolor</italic>, <italic>Solanum tuberosum</italic>, <italic>Triticum aestivum</italic>, <italic>Hordeum vulgare</italic>, <italic>P. equestris</italic>, <italic>Dendrobium catenatum</italic>, and <italic>A. shenzhenica</italic>) were used for homology-based predictions, one species at a time. We used the TBLASTN to search the non-redundant protein sequences of each gene set with an E-value &#x003C; 1e-2. Only regions with homologous blocks longer than 80% of the query protein were retained. The best hits were selected. Then, the EVM was used to construct the gene structures. After repeat sequences were masked using the homology-based approach, three softwares, AUGUSTUS (<xref ref-type="bibr" rid="B34">Stanke et al., 2006</xref>), SNAP (<xref ref-type="bibr" rid="B15">Korf, 2004</xref>), and GlimmerHMM (<xref ref-type="bibr" rid="B26">Majoros et al., 2004</xref>), were used for the genes <italic>de novo</italic> prediction. Information obtained from the homology-based predictions and <italic>de novo</italic> predictions were then integrated in the GLEAN to generate a consensus gene set. Finally, RNA-seq data from a single <italic>G. elata</italic> plant&#x2019;s flower, stem, and tuber tissues were obtained and assembled for the facilitating of the protein-coding gene annotation.</p>
</sec>
<sec id="S2.SS6">
<title>Functional Annotation</title>
<p>Best hits were selected from alignments to the SwissProt and TrEMBL databases to assign gene function information. Gene motifs and domains were identified using the InterProScan5<sup><xref ref-type="fn" rid="footnote6">6</xref></sup> (<xref ref-type="bibr" rid="B14">Jones et al., 2014</xref>) by alignment to databases including the ProDom, PRINTS, Pfam, SMART, PANTHER, and PROSITE. According to the corresponding SwissProt and TrEMBL entries information, Gene Ontology (GO) terms and ID for each gene was obtained. Kyoto Encyclopedia of Genes and Genomes (KEGG) protein database was used as reference for gene alignments to obtain KEGG IDs as well as the corresponding pathways information.</p>
</sec>
<sec id="S2.SS7">
<title>Gene Family Clustering</title>
<p>All proteins from selected 13 species (<italic>Gastodia elata</italic>, <italic>P. equestris</italic>, <italic>D. officinale</italic>, <italic>D. catenatum</italic>, <italic>A. shenzhenica</italic>, <italic>B. distachyon</italic>, <italic>O. sativa</italic>, <italic>S. bicolor</italic>, <italic>Spirodela polyrhiza</italic>, <italic>Musa acuminata, A. thaliana</italic>, <italic>Populus trichocarpa</italic>, and <italic>Vitis vinifera</italic>) were aligned using the BLASTP, then, the gene families were defined using the OrthoMCL (<xref ref-type="bibr" rid="B22">Li et al., 2003</xref>). CAF&#x00C9; (<xref ref-type="bibr" rid="B6">De Bie et al., 2006</xref>) was then used to identify gene family expansions and contractions in <italic>G. elata.</italic> To identify gene family clusters in these species and <italic>G. elata</italic>, we performed all-versus-all protein alignments using the BLASTP with the E-value threshold set to &#x201C;1e-5.&#x201D; We used the OrthoMCL to process high scoring segment pairs. The MCL module from OrthoMCL was then used to define final paralogous and orthologous genes with the parameter set as &#x201C;&#x2212;abc &#x2013;I = 1.5&#x201D;.</p>
</sec>
<sec id="S2.SS8">
<title>Phylogenetic Tree Construction and Divergence Time Estimation</title>
<p>Those single-copy orthologs identified from gene family cluster analysis of the aforementioned species were used to construct a phylogenetic tree. MUSCLE version 3.6<sup><xref ref-type="fn" rid="footnote7">7</xref></sup> (<xref ref-type="bibr" rid="B8">Edgar, 2004</xref>) was used with default settings to perform multiple sequence alignments. Fourfold degenerate sites of genes were collected and concatenated into a &#x201C;super sequence&#x201D; for each species. We used the MrBayes<sup><xref ref-type="fn" rid="footnote8">8</xref></sup> (<xref ref-type="bibr" rid="B12">Huelsenbeck and Ronquist, 2001</xref>) to reconstruct phylogenetic trees between species. The &#x201C;MCMCTREE&#x201D; module from the PAML package<sup><xref ref-type="fn" rid="footnote9">9</xref></sup> (<xref ref-type="bibr" rid="B43">Yang, 2007</xref>) was used to estimate the divergence time among species.</p>
</sec>
<sec id="S2.SS9">
<title>Chloroplast Genome (Plastome) Assembly and Annotation</title>
<p>The clean reads were aligned to the plastomes of <italic>P. equestris</italic> and <italic>D. officinale</italic> (<xref ref-type="bibr" rid="B13">Jheng et al., 2012</xref>; <xref ref-type="bibr" rid="B42">Yang et al., 2016</xref>) using the bowtie2 with default settings, respectively. Reads extracted from the &#x201C;paired-aligned&#x201D; alignments were merged and assembled using the SOAPdenovo with default parameters. Contigs shorter than 100 bp were excluded. Filtered contigs were joined to scaffolds based on the paired-end information and gaps between scaffolds were closured. DOGMA<sup><xref ref-type="fn" rid="footnote10">10</xref></sup> (<xref ref-type="bibr" rid="B40">Wyman et al., 2004</xref>) was used to annotate the protein-coding genes and tRNA genes with the cut-off set to 80%. The boundaries of protein-coding genes and plastome structures were manually checked by comparison to the plastomes of <italic>P. equestris</italic> and <italic>D. officinale</italic>. The linear plot of <italic>G. elata</italic> plastome was yielded by the OGDRAW<sup><xref ref-type="fn" rid="footnote11">11</xref></sup> (<xref ref-type="bibr" rid="B25">Lohse et al., 2013</xref>), followed with some manual adjustments.</p>
</sec>
<sec id="S2.SS10">
<title>Relaxation Selection Analyses and Symbiotic Gene Analysis</title>
<p>These nuclear-encoded photosynthesis-related proteins were identified based on the National Center for Biotechnology Information (NCBI) database. Genome sequences of seven species (<italic>G. elata, A. shenzhenica, P. equestris, D. catenatum, D. officinale, O. sativa</italic>, and <italic>A. thaliana</italic>) were searched for all of the known plant nuclear-encoded photosynthesis-related genes. Only genes that were in a one-to-one orthologs for every pair of genomes of the seven species were used in our analyses. For genes that have more than one transcript, we aligned all of the possible transcript pairs to all seven species and retained those that provided the highest alignment scores. Alignments and consensus trees were used for posterior molecular evolutionary analysis. We used a gene-level approach based on the ratio of non-synonymous (<italic>K</italic><sub><italic>a</italic></sub>) to synonymous (<italic>K</italic><sub><italic>s</italic></sub>) substitutions rate (&#x03C9; = <italic>K</italic><sub><italic>a</italic></sub>/<italic>K</italic><sub><italic>s</italic></sub>) to identify potential relaxation of selective constraints, using the CODEML likelihood ratio tests (LRTs) algorithm from the PAML package. First, we tested branch models M0, the simplest model, which has a single &#x03C9; ratio for the entire tree. Subsequently, we used two-ratio models that allow a background &#x03C9; ratio and a different &#x03C9; on the branch of interest. For null hypotheses, we used the one-ratio model, two-ratio model, and more models with a fixed &#x03C9; = 1 on the branch under analysis. The level of significance for these LRTs was calculated using a &#x03C7;<sup>2</sup> approximation, where twice the difference of log likelihood between the models (2&#x0394;lnL) would be asymptotic to a &#x03C7;<sup>2</sup> distribution, with the number of degrees of freedom corresponding to the difference in the number of parameters between the nested models.</p>
<p>These Gastrodia antifungal protein (GAFP) were downloaded from the NCBI database. Genome sequences of seven species (<italic>G. elata, A. shenzhenica, P. equestris, D. catenatum, D. officinale, O. sativa</italic>, and <italic>A. thaliana</italic>) were searched for all of the known GAFP genes with blast software. Finally, the genes with E-value &#x2264; 1e-6 in the comparison result were selected as a candidate GAFP gene. And the protein domain of carotenoid cleavage dioxygenases (CCDs) was downloaded from the pfam website. The hmmersearch software were used for sequence alignment to identify CCDs genes in other species. The identified genes are calculated by <italic>K</italic><sub><italic>a</italic></sub>/<italic>K</italic><sub><italic>s</italic></sub> to verify whether positive selection occurred in <italic>G. elata</italic>.</p>
</sec>
<sec id="S2.SS11">
<title>High Performance Liquid Chromatography Analysis of Photosynthetic Pigments</title>
<p>From each sample of <italic>G. elata</italic>&#x2019;s vestigial scalelike leaves and <italic>P. equestris</italic>&#x2019;s and <italic>D. Officinale</italic>&#x2019;s normal leaves, about 1 g of leave tissue was collected and dried as powder. Then, the dried powder was dealt with 100% 40 mL of methanol for half an hour and sonicated for an hour, and then, methanol diluted to 50 mL. The methanol extract was then filtered by the 0.45 &#x03BC;m membrane filter. Ten microliters of filtrate was prepared for high performance liquid chromatography (HPLC). Quantitative analysis of the photosynthetic pigments of three species was performed using the chromatographic column Inertsil ODS-3 (250 mm &#x00D7; 4.6 mm, 5 &#x03BC;m) and the column temperature was maintained at 25&#x00B0;C with the flow rate set as 1 mL &#x00D7; min<sup>&#x2013;1</sup>. The mobile phase was consisted of A: acetonitrile and 0.05 mol/L of Tris&#x2013;HC1 buffer (70:3); and B: methanol and n-hexane (5:1). Gradient elution was then used with the following system: 100% A at initiation, 100% A at 18 min, 100% B at 20.5 min, and 100% B at 46 min. 445 nm was used to detect photosynthetic pigments.</p>
</sec>
</sec>
<sec id="S3">
<title>Results</title>
<sec id="S3.SS1">
<title>De novo Assembly of the <italic>G. elata</italic> Genome</title>
<p>The genome size of <italic>G. elata</italic> was estimated to be 1.378 Gb using the <italic>K</italic>-mer distribution analysis (<xref ref-type="supplementary-material" rid="FS1">Supplementary Figure 2</xref>). All 483.07 Gb clean data (350.56 &#x00D7; genome coverage) were <italic>de novo</italic> assembled into 69,353 contigs (1.11 Gb in total length) with a contig N50 size of 110.03 kb, and 45,884 scaffolds (1.12 Gb in total length) with a scaffold N50 size of 1.64 Mb (<xref ref-type="supplementary-material" rid="TS1">Supplementary Table 3</xref>). As a result of high genome coverage, our <italic>G. elata</italic> assembly had a much longer contig N50 size (110.03 kb) than that from a previous study (68.9 kb, <xref ref-type="table" rid="T1">Table 1</xref>; <xref ref-type="bibr" rid="B44">Yuan et al., 2018</xref>). Preliminary evaluation of the quality of our assembly showed that at least 92% of the clean reads from different insert-sizes of paired-end libraries could be mapped back to the assembled genome (<xref ref-type="supplementary-material" rid="TS1">Supplementary Table 4</xref>). In addition, over 82.37 million RNA sequencing reads from each of the flower, stem, and tuber tissues were generated to further verify the quality of the assembly. The overall mapping ratios of these reads to the genome assembly were 90.7% for the flower, 93.8% for the stem, and 67.1% for the tuber (<xref ref-type="supplementary-material" rid="TS1">Supplementary Table 2</xref>), indicating the high quality of the <italic>G. elata</italic> genome.</p>
<p>The completeness of the genic regions and other genomic elements in our <italic>G. elata</italic> genome was evaluated by the BUSCOs approach (<xref ref-type="bibr" rid="B37">Waterhouse et al., 2017</xref>). The result showed that 248 out of 303 (81.85%) near-universal single-copy orthologs were identified in our <italic>G. elata</italic> genome. This number was much higher than that reported in the previous study (67.15% BUSCO completeness, <xref ref-type="table" rid="T1">Table 1</xref>; <xref ref-type="bibr" rid="B44">Yuan et al., 2018</xref>). Additionally, 12 BUSCO genes (3.96%) had fragmented matches, and 43 BUSCO genes (14.19%) were missing in our assembly. Both parameters were lower than that reported in the previous study (4.39 and 28.45%, respectively, <xref ref-type="table" rid="T1">Table 1</xref>; <xref ref-type="bibr" rid="B44">Yuan et al., 2018</xref>). These data demonstrated that our <italic>G. elata</italic> genome had a much higher completeness for subsequent functional analysis.</p>
</sec>
<sec id="S3.SS2">
<title><italic>Gastrodia elata</italic> Genome Repeat Analysis</title>
<p>Repetitive DNA elements constituted approximately 68.34% of the acquired genome (<xref ref-type="supplementary-material" rid="TS1">Supplementary Table 5</xref>). This proportion was higher than those of the other orchids genomes, including <italic>P. equestris</italic> (62%) (<xref ref-type="bibr" rid="B3">Cai et al., 2015</xref>), <italic>D. officinale</italic> (63.33%) (<xref ref-type="bibr" rid="B23">Liang et al., 2015</xref>), and <italic>A. shenzhenica</italic> (42.05%) (<xref ref-type="bibr" rid="B45">Zhang et al., 2017</xref>). Long interspersed nuclear elements (LINEs) and DNA transposons constituted 6.20 and 7.49% of the total genome assembly, respectively (<xref ref-type="supplementary-material" rid="TS1">Supplementary Table 5</xref>). The long terminal repeats (LTRs) were the most abundant TEs, which constituted 59.95% of the genome (<xref ref-type="supplementary-material" rid="TS1">Supplementary Table 5</xref>). Notably, Gypsy-type (37.41%) and Copia-type (8.07%) TEs accounted for most of the LTRs (<xref ref-type="supplementary-material" rid="TS1">Supplementary Table 6</xref>). Sequence divergence line plot of Copia and Gypsy types of TEs shows that both of the two types experienced two recently expansion events during the same periods (<xref ref-type="supplementary-material" rid="FS1">Supplementary Figure 3a</xref>). Compared to the conserved single copy genes, those duplicated genes (&#x201C;accessory genes&#x201D;) in <italic>G. elata</italic> are located closer to the TEs (Fisher&#x2019;s exact test, <italic>P</italic> &#x003C; 0.005), suggesting their contribution in gene copy number variation and the important role in <italic>G. elata</italic> evolution (<xref ref-type="supplementary-material" rid="FS1">Supplementary Figure 3b</xref>).</p>
</sec>
<sec id="S3.SS3">
<title>Orthologous Gene Analysis in the <italic>G. elata</italic> Genome</title>
<p>Overall, we identified 24,484 protein-coding genes (<xref ref-type="supplementary-material" rid="TS1">Supplementary Table 7</xref>) with about 10.05 kb average length in the <italic>G. elata</italic> genome that belonged to 11,065 unique gene families (<xref ref-type="supplementary-material" rid="TS1">Supplementary Table 8</xref>). Besides, we also identified a myriad of microRNAs (1,125), transfer RNAs (1,123), ribosomal RNAs (1,596), and small nuclear RNAs (868; <xref ref-type="supplementary-material" rid="TS1">Supplementary Table 9</xref>) in the <italic>G. elata</italic> genome.</p>
<p>Phylogenetic analysis with divergence time estimation showed that the <italic>G. elata</italic> diverged from other orchids somewhere between 72.3 and 55.8 million years ago (Mya) (<xref ref-type="fig" rid="F1">Figure 1B</xref>). During the course of evolution, it is apparent that 19 gene families were significantly expanded (<italic>P</italic> &#x003C; 0.001; <xref ref-type="supplementary-material" rid="TS1">Supplementary Table 10</xref>), whereas six gene families were significantly contracted in the <italic>G. elata</italic> genome (<italic>P</italic> &#x003C; 0.001; <xref ref-type="supplementary-material" rid="TS1">Supplementary Table 11</xref>). KEGG enrichment analyses showed that gene families involved in flavonoid biosynthesis, plant-pathogen interaction, and circadian rhythm were significantly contracted in the <italic>G. elata</italic> genome (<xref ref-type="supplementary-material" rid="TS1">Supplementary Table 12</xref>). In comparison, the expanded gene families are mainly involved in the glycan, sphingolipid, and galactose metabolisms, and intriguingly, also plant-pathogen interaction (<xref ref-type="supplementary-material" rid="TS1">Supplementary Table 13</xref>). Since some members of the plant-pathogen interaction gene families were contracted and other members were expanded, it is possible that <italic>G. elata</italic> may have rewired its pathogen resistance pathway when adapting to the low-light environment. Indeed, <italic>G. elata</italic> as a fully mycoheterotrophic plant not only needs to obtain nutrients from the fungi associates, but also have to prevent the fungi from invading into the inner most section of the tuber (<xref ref-type="bibr" rid="B46">Zhang, 1980</xref>).</p>
</sec>
<sec id="S3.SS4">
<title><italic>Gastrodia elata</italic> Plastome Assembly and Relaxed Selection of Plastid Genes</title>
<p>The conserved plastome structure of most land plants generally is a quadripartite single circular molecule of 100&#x2013;220 kb. It consists of a small and a large single-copy regions (SSC and LSC) which are separated by a pair of inverted repeats (IRs) (<xref ref-type="bibr" rid="B33">Sandelius and Aronsson, 2009</xref>). The plastome of the photosynthetic plant harbors around 100 essential genes that primarily encode RNAs and proteins involved in photosynthesis, transcription, and translation (<xref ref-type="bibr" rid="B5">Daniell et al., 2016</xref>). <italic>P. equestris</italic> and <italic>D. officinale</italic> are two photosynthetic orchids with fully functional plastomes as other land plants (<xref ref-type="bibr" rid="B13">Jheng et al., 2012</xref>; <xref ref-type="bibr" rid="B42">Yang et al., 2016</xref>). The plastomes of these two orchids (with sizes of 148,959 and 152,018 bp, respectively) both have the typical quadripartite single circular molecule structure with relatively complete photosynthesis-related gene sets (<xref ref-type="fig" rid="F2">Figure 2</xref>). In comparison, the plastome of <italic>G. elata</italic> was assembled with the size of 40,037 bp, meaning that more than two thirds of the plastome sequence was lost after the transition to a low-light heterotrophic lifestyle (<xref ref-type="fig" rid="F2">Figure 2</xref>). IRs are considered to play roles in plastome stabilization (<xref ref-type="bibr" rid="B30">Palmer and Thompson, 1982</xref>). In the <italic>G. elata</italic> plastome, one copy of IR was completely lost, and the remaining IR sequence was less than half the size of its counterparts in the other two orchids. The <italic>G. elata</italic> LSC retained less than a quarter of the sequence size compared to the two orchid plastomes, and the <italic>G. elata</italic> SSC also lost half of its size.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption><p>Plastid map of three orchid plants. The plastid of <italic>G. elata</italic> shows significant degradation comparing with <italic>P. equestris</italic> and <italic>D. officinale</italic>. &#x03A8; indicates the pseudogenes.</p></caption>
<graphic xlink:href="fgene-11-580568-g002.tif"/>
</fig>
<p>Only 50 genes were identified in the <italic>G. elata</italic> plastome, among which 10 genes were manually checked to be pseudogenes (with frameshifts or premature stop codons) (<xref ref-type="supplementary-material" rid="TS1">Supplementary Table 14</xref>). The photosynthesis-related genes in the <italic>G. elata</italic> plastome were carefully checked. The result showed that the paralogs of <italic>psa</italic> and <italic>psb</italic> (photosystem I and II genes), <italic>pet</italic> (cytochrome b/f complex genes), <italic>rbc</italic> (rubisco subunit genes), and <italic>atp</italic> (ATP synthase genes) were completely lost or were found to have incomplete gene structures due to a reduced LSC. Two of the six remaining <italic>ndh</italic> (NADH dehydrogenase) genes were found to be non-functional. All these changes concluded that the genomic basis of photosynthesis in the <italic>G. elata</italic> plastome was highly degenerated. These observations are in accordance with a previous report (<xref ref-type="bibr" rid="B44">Yuan et al., 2018</xref>), which includes small assembled plastome sizes (40,026 vs. 35,326 bp), extensively loss of DNA fragments, missing of one copy of IR structure, and loss or non-functional of photosynthesis-related genes.</p>
<p>Natural selection is essential in the maintenance of trait for the plant population. The weakening or disappear of selection strength that leads to trait variations is referred to as &#x201C;relaxed selection&#x201D; (<xref ref-type="bibr" rid="B18">Lahti et al., 2009</xref>). In its evolutionary history, <italic>G. elata</italic> experienced the transition to a low-light, undergrowth environment (<xref ref-type="bibr" rid="B2">Bidartondo, 2005</xref>) and a fully heterotrophic lifestyle. This transition made photosynthesis dispensable for <italic>G. elata</italic> to survive. We therefore hypothesized that the remaining photosynthesis-related plastome genes might be under relaxed selection. Indeed, the <italic>K</italic><sub><italic>a</italic></sub>/<italic>K</italic><sub><italic>s</italic></sub> values of these genes (includes <italic>psa</italic>, <italic>psb</italic>, <italic>atp</italic>, <italic>pet</italic> genes, and so on) in <italic>G. elata</italic> were higher than <italic>D. officinale</italic> and <italic>P. equestris</italic>, and non-orchid plant species (<xref ref-type="supplementary-material" rid="TS1">Supplementary Table 15</xref>). This indicates the reduction of functional constraints, and, thus, these genes were under a significantly different selective regime in <italic>G. elata</italic> than in those photosynthetically active species.</p>
</sec>
<sec id="S3.SS5">
<title>Relaxation of Selective Constraints of Nuclear-Coded Photosynthesis-Related Genes in <italic>G. elata</italic></title>
<p>We define &#x201C;photosynthesis-related genes&#x201D; as all known genes that are involved in the structure, development, and normal function of the plastid and leaf in land plants. The plastome only contains a small part of these photosynthesis-related genes, and the rest are within the plant nuclear genome. Based on the aforementioned hypothesis, we also checked the molecular evolution of the photosynthesis-related nuclear genes in the <italic>G. elata</italic> genome. In brief, they consisted of 4,818 plastid-related genes, 203 leaf development-related genes, and 1,408 genes that were directly involved in the photosynthesis. The <italic>K</italic><sub><italic>a</italic></sub>/<italic>K</italic><sub><italic>s</italic></sub> values of these genes in <italic>G. elata</italic> were significantly higher than those in other orchids and non-orchid plant species, indicating relaxation of selective constraints on the leaf development and the photosynthesis process (<italic>t</italic>-test and two-way ANOVA test, <italic>p</italic> &#x003C; 0.05, <xref ref-type="fig" rid="F3">Figure 3</xref> and <xref ref-type="supplementary-material" rid="FS1">Supplementary Figure 4</xref>). We also found that the <italic>K</italic><sub><italic>a</italic></sub>/<italic>K</italic><sub><italic>s</italic></sub> values of these searched genes in orchids were higher than those in non-orchid species. It suggested that there might be a partial relaxation of selection on plastid and leave functions in the photosynthetic orchids due to their symbiotic relationships with fungi. These findings also suggested a positive correlation between the degree of heterotrophy in plants and the non-synonymous mutation rates in genes that were involved in the photosynthetic process, plastid and leave functions.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption><p>Relaxation of selective constraints on nuclear-encoded genes. <italic>K</italic><sub><italic>a</italic></sub>/<italic>K</italic><sub><italic>s</italic></sub> ratios of nuclear-encoded plastid genes and genes involved in leaf development in <italic>G. elata</italic>, other orchids (including <italic>D. officinale</italic>, <italic>P. equestris</italic>, <italic>D. catenatum</italic>, and <italic>A. shenzhenica</italic>) and other green plants (including <italic>A. thaliana</italic> and <italic>O. sativa</italic>). &#x002A;<italic>P</italic> &#x003C; 0.05.</p></caption>
<graphic xlink:href="fgene-11-580568-g003.tif"/>
</fig>
</sec>
<sec id="S3.SS6">
<title>Analysis of Symbiotic Genes in <italic>G. elata</italic> Genome</title>
<p>Since <italic>G. elata</italic> cannot perform photosynthesis, it relies on symbiotic genes for nutrition, so symbiotic genes are also attracting attention in the <italic>Analysis of Symbiotic Genes in Gastrodia Genome</italic>. <italic>G. elata</italic> exists underground without leaves and chloroplasts, with the nutrients necessary for growth being supplied by the symbiotic fungus <italic>Armillaria mellea</italic> (<xref ref-type="bibr" rid="B32">Sa et al., 2003</xref>) fungus. Gastrodia antifungal protein (GAFP, also known as gastrodianin) was first purified from the cortex of the terminal corm of <italic>G. elata</italic> (<xref ref-type="bibr" rid="B11">Hu et al., 1988</xref>). It is mainly distributed throughout the epidermis and cortex layer of <italic>G. elata</italic> (<xref ref-type="bibr" rid="B24">Liu et al., 1993</xref>; <xref ref-type="bibr" rid="B10">Hu and Huang, 1994</xref>) and shows a strong fungistatic activity against a broad spectrum of fungi, including <italic>A. mellea</italic> (<xref ref-type="bibr" rid="B10">Hu and Huang, 1994</xref>), <italic>Rhizoctonia solani</italic>, <italic>Valsa ambiens</italic>, <italic>Gibberella zeae</italic>, <italic>Ganoderma lucidum</italic>, and <italic>Botrytis cinerea in vitro</italic> to reach plants symbiosis with microorganisms (<xref ref-type="bibr" rid="B36">Wang et al., 2001</xref>). In the <italic>G. elata</italic> genome, we identified 20 GAFP genes, 10 GAFP genes in <italic>A. shenzhenica</italic>, and 0 in <italic>A. thaliana</italic>, which indicates that GAFP has expanded in <italic>G. elata</italic> (<xref ref-type="supplementary-material" rid="TS1">Supplementary Table 16</xref>). It is known that strigolactone can stimulate hyphal branching and development of arbuscular mycorrhizal fungi, which increases the chances of an encounter with a host plant (<xref ref-type="bibr" rid="B17">Kretzschmar et al., 2012</xref>). Strigolactone is an important signal for the establishment of the symbiosis relationship between <italic>G. elata</italic> and <italic>A. mellea</italic>. Its mechanism of action is similar to that of promoting symbiosis between plants and mycorrhiza. In this article, we have identified the key genes for the biosynthesis of strigolactone CCDs (<xref ref-type="bibr" rid="B7">Delaux et al., 2012</xref>). In the <italic>G. elata</italic> genome, 12 CCDs genes were identified, whereas ten and nine CCDs genes were identified in <italic>A. shenzhenica</italic> and <italic>A. thaliana</italic>, respectively. In order to verify whether the CCDs gene has positive selection in <italic>G. elata</italic>, we further performed the <italic>K</italic><sub><italic>a</italic></sub>/<italic>K</italic><sub><italic>s</italic></sub> analysis. The <italic>K</italic><sub><italic>a</italic></sub>/<italic>K</italic><sub><italic>s</italic></sub> values of these genes in <italic>G. elata</italic> were significantly higher than those in <italic>D. catenatum</italic> and <italic>P. equestris</italic>. It showed that, compared with some orchid and non-orchid plant species, CCDs have expanded in the <italic>G. elata</italic> genome.</p>
</sec>
<sec id="S3.SS7">
<title>Genomic Basis for the Achlorophyllous Phenotype in <italic>G. elata</italic></title>
<p>We next investigated nuclear-encoded genes involved in the plant pigment synthesis in the <italic>G. elata</italic> genome. We detected no copies of four core genes in the chlorophyll biosynthetic pathway (<italic>UROS</italic>, <italic>CAO</italic>, <italic>LPOR</italic>, and <italic>VDE</italic>; <xref ref-type="supplementary-material" rid="FS1">Supplementary Figure 5a</xref>). This is in line with the result that no signals of major photosynthetic pigments could be detected via the HPLC in the <italic>G. elata</italic> plant tissue (compared to the other two orchids <italic>D. officinale</italic> and <italic>P. equestris</italic>) (<xref ref-type="supplementary-material" rid="FS1">Supplementary Figure 5b</xref>). Moreover, three essential genes (<italic>PDV1</italic>, <italic>PDV2</italic>, and <italic>ARC3</italic>) involved in the chloroplast division were also not detected (<xref ref-type="supplementary-material" rid="FS1">Supplementary Figure 6</xref>). These results clearly showed the genomic basis for the achlorophyllous phenotype in <italic>G. elata</italic>.</p>
</sec>
</sec>
<sec id="S4">
<title>Conclusion</title>
<p>The <italic>G. elata</italic> genome provides an illuminating model for probing evolutionary molecular changes associated with leaf loss, plastid degeneration, and plant-fungal symbioses. Both plastid-encoded and nuclear-encoded photosynthesis-related genes in <italic>G. elata</italic> showed evidence of the relaxation of selective constraints. Besides the profound changes in the photosynthetic system, it is possible that future research could identify the underlying mechanisms for the rewiring of basic metabolic pathways, the evolution of TEs, gene death, and generation of new genes, since an improved <italic>G. elata</italic> genome is now available. Thus, the genome sequence of <italic>G. elata</italic> would be a valuable resource for future investigations of the evolution of orchids and non-photosynthetic plants at both the genomic and the whole-organism levels.</p>
</sec>
<sec id="S5">
<title>Data Availability Statement</title>
<p>The datasets presented in this study can be found in online repositories. The names of the repository/repositories and accession number(s) can be found below: NCBI database under BioProject <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="PRJNA394702">PRJNA394702</ext-link>.</p>
</sec>
<sec id="S6">
<title>Author Contributions</title>
<p>SSC, GHZ, and WLS collected the samples and performed the experiments. XW, YZW, and XD completed the data analysis. YD, WC, WW, MA, and JHM edited and modified the manuscript. All authors read and approved the manuscript.</p>
</sec>
<sec id="conf1">
<title>Conflict of Interest</title>
<p>XW was employed by the company Jiaxing Synbiolab Biotechnology Co., Ltd. and she declared that Jiaxing Synbiolab Biotechnology Co., Ltd. plays no role in the funding, design, analysis, and publication of this manuscript. The remaining authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
</body>
<back>
<fn-group>
<fn fn-type="financial-disclosure">
<p><bold>Funding.</bold> This study was supported by &#x201C;The Thousand Talents Program&#x201D; (Class B) of the government of China, National Key R&#x0026;D Program of China (2019YFC1711100), Yunnan Provincial Key Programs of Yunnan Eco-friendly Food International Cooperation Research Center Project (2019ZG00908), and the Guangxi Innovation-Driven Development Project (GuiKe AA18242040).</p>
</fn>
</fn-group>
<sec id="S8" sec-type="supplementary material"><title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fgene.2020.580568/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fgene.2020.580568/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Data_Sheet_1.PDF" id="FS1" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Data_Sheet_2.xlsx" id="TS1" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Barrett</surname> <given-names>C. F.</given-names></name> <name><surname>Davis</surname> <given-names>J. I.</given-names></name></person-group> (<year>2012</year>). <article-title>The plastid genome of the mycoheterotrophic <italic>Corallorhiza striata</italic> (Orchidaceae) is in the relatively early stages of degradation.</article-title> <source><italic>Am. J. Bot.</italic></source> <volume>99</volume> <fpage>1513</fpage>&#x2013;<lpage>1523</lpage>. <pub-id pub-id-type="doi">10.3732/ajb.1200256</pub-id> <pub-id pub-id-type="pmid">22935364</pub-id></citation></ref>
<ref id="B2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bidartondo</surname> <given-names>M. I.</given-names></name></person-group> (<year>2005</year>). <article-title>The evolutionary ecology of myco-heterotrophy.</article-title> <source><italic>New Phytol.</italic></source> <volume>167</volume> <fpage>335</fpage>&#x2013;<lpage>352</lpage>. <pub-id pub-id-type="doi">10.1111/j.1469-8137.2005.01429.x</pub-id> <pub-id pub-id-type="pmid">15998389</pub-id></citation></ref>
<ref id="B3"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cai</surname> <given-names>J.</given-names></name> <name><surname>Liu</surname> <given-names>X.</given-names></name> <name><surname>Vanneste</surname> <given-names>K.</given-names></name> <name><surname>Proost</surname> <given-names>S.</given-names></name> <name><surname>Tsai</surname> <given-names>W. C.</given-names></name> <name><surname>Liu</surname> <given-names>K. W.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>The genome sequence of the orchid <italic>Phalaenopsis equestris</italic>.</article-title> <source><italic>Nat. Genet.</italic></source> <volume>47</volume> <fpage>65</fpage>&#x2013;<lpage>72</lpage>. <pub-id pub-id-type="doi">10.1038/ng.3149</pub-id> <pub-id pub-id-type="pmid">25420146</pub-id></citation></ref>
<ref id="B4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cribb</surname> <given-names>P.</given-names></name> <name><surname>Killmann</surname> <given-names>E. F. A. D.</given-names></name></person-group> (<year>2010</year>). <article-title>A revision of Gastrodia (Orchidaceae: Epidendroideae, Gastrodieae) in tropical Africa.</article-title> <source><italic>Kew Bull.</italic></source> <volume>65</volume> <fpage>315</fpage>&#x2013;<lpage>321</lpage>. <pub-id pub-id-type="doi">10.1007/s12225-010-9193-4</pub-id></citation></ref>
<ref id="B5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Daniell</surname> <given-names>H.</given-names></name> <name><surname>Lin</surname> <given-names>C. S.</given-names></name> <name><surname>Yu</surname> <given-names>M.</given-names></name> <name><surname>Chang</surname> <given-names>W. J.</given-names></name></person-group> (<year>2016</year>). <article-title>Chloroplast genomes: diversity, evolution, and applications in genetic engineering.</article-title> <source><italic>Genome Biol.</italic></source> <volume>17</volume>:<issue>134</issue>. <pub-id pub-id-type="doi">10.1186/s13059-016-1004-2</pub-id> <pub-id pub-id-type="pmid">27339192</pub-id></citation></ref>
<ref id="B6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>De Bie</surname> <given-names>T.</given-names></name> <name><surname>Cristianini</surname> <given-names>N.</given-names></name> <name><surname>Demuth</surname> <given-names>J. P.</given-names></name> <name><surname>Hahn</surname> <given-names>M. W.</given-names></name></person-group> (<year>2006</year>). <article-title>CAFE: a computational tool for the study of gene family evolution.</article-title> <source><italic>Bioinformatics</italic></source> <volume>22</volume> <fpage>1269</fpage>&#x2013;<lpage>1271</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btl097</pub-id> <pub-id pub-id-type="pmid">16543274</pub-id></citation></ref>
<ref id="B7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Delaux</surname> <given-names>P. M.</given-names></name> <name><surname>Xie</surname> <given-names>X.</given-names></name> <name><surname>Timme</surname> <given-names>R. E.</given-names></name> <name><surname>Puech-Pages</surname> <given-names>V.</given-names></name> <name><surname>Dunand</surname> <given-names>C.</given-names></name> <name><surname>Lecompte</surname> <given-names>E.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>Origin of strigolactones in the green lineage.</article-title> <source><italic>New Phytol.</italic></source> <volume>195</volume> <fpage>857</fpage>&#x2013;<lpage>871</lpage>. <pub-id pub-id-type="doi">10.1111/j.1469-8137.2012.04209.x</pub-id> <pub-id pub-id-type="pmid">22738134</pub-id></citation></ref>
<ref id="B8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Edgar</surname> <given-names>R. C.</given-names></name></person-group> (<year>2004</year>). <article-title>MUSCLE: multiple sequence alignment with high accuracy and high throughput.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>32</volume> <fpage>1792</fpage>&#x2013;<lpage>1797</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkh340</pub-id> <pub-id pub-id-type="pmid">15034147</pub-id></citation></ref>
<ref id="B9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Grabherr</surname> <given-names>M. G.</given-names></name> <name><surname>Haas</surname> <given-names>B. J.</given-names></name> <name><surname>Yassour</surname> <given-names>M.</given-names></name> <name><surname>Levin</surname> <given-names>J. Z.</given-names></name> <name><surname>Thompson</surname> <given-names>D. A.</given-names></name> <name><surname>Amit</surname> <given-names>I.</given-names></name><etal/></person-group> (<year>2011</year>). <article-title>Full-length transcriptome assembly from RNA-Seq data without a reference genome.</article-title> <source><italic>Nat. Biotechnol.</italic></source> <volume>29</volume> <fpage>644</fpage>&#x2013;<lpage>652</lpage>. <pub-id pub-id-type="doi">10.1038/nbt.1883</pub-id> <pub-id pub-id-type="pmid">21572440</pub-id></citation></ref>
<ref id="B10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hu</surname> <given-names>Z.</given-names></name> <name><surname>Huang</surname> <given-names>Q. Z.</given-names></name></person-group> (<year>1994</year>). <article-title>Induction and accumulation of the antifungal protein in <italic>Gastrodia elata</italic>.</article-title> <source><italic>Acta Bot. Yunnan</italic></source> <volume>16</volume> <fpage>169</fpage>&#x2013;<lpage>177</lpage>.</citation></ref>
<ref id="B11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hu</surname> <given-names>Z.</given-names></name> <name><surname>Yang</surname> <given-names>Z.</given-names></name> <name><surname>Wang</surname> <given-names>J.</given-names></name></person-group> (<year>1988</year>). <article-title>Isolation and partial characterization of an antifungal protein from Gastrodia elata corm.</article-title> <source><italic>Acta Bot. Yunnanica</italic></source> <volume>10</volume> <fpage>373</fpage>&#x2013;<lpage>380</lpage>.</citation></ref>
<ref id="B12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Huelsenbeck</surname> <given-names>J. P.</given-names></name> <name><surname>Ronquist</surname> <given-names>F.</given-names></name></person-group> (<year>2001</year>). <article-title>MRBAYES: bayesian inference of phylogenetic trees.</article-title> <source><italic>Bioinformatics</italic></source> <volume>17</volume> <fpage>754</fpage>&#x2013;<lpage>755</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/17.8.754</pub-id> <pub-id pub-id-type="pmid">11524383</pub-id></citation></ref>
<ref id="B13"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jheng</surname> <given-names>C. F.</given-names></name> <name><surname>Chen</surname> <given-names>T. C.</given-names></name> <name><surname>Lin</surname> <given-names>J. Y.</given-names></name> <name><surname>Chen</surname> <given-names>T. C.</given-names></name> <name><surname>Wu</surname> <given-names>W. L.</given-names></name> <name><surname>Chang</surname> <given-names>C. C.</given-names></name></person-group> (<year>2012</year>). <article-title>The comparative chloroplast genomic analysis of photosynthetic orchids and developing DNA markers to distinguish <italic>Phalaenopsis orchids</italic>.</article-title> <source><italic>Plant Sci.</italic></source> <volume>190</volume> <fpage>62</fpage>&#x2013;<lpage>73</lpage>. <pub-id pub-id-type="doi">10.1016/j.plantsci.2012.04.001</pub-id> <pub-id pub-id-type="pmid">22608520</pub-id></citation></ref>
<ref id="B14"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jones</surname> <given-names>P.</given-names></name> <name><surname>Binns</surname> <given-names>D.</given-names></name> <name><surname>Chang</surname> <given-names>H. Y.</given-names></name> <name><surname>Fraser</surname> <given-names>M.</given-names></name> <name><surname>Li</surname> <given-names>W.</given-names></name> <name><surname>McAnulla</surname> <given-names>C.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>InterProScan 5: genome-scale protein function classification.</article-title> <source><italic>Bioinformatics</italic></source> <volume>30</volume> <fpage>1236</fpage>&#x2013;<lpage>1240</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btu031</pub-id> <pub-id pub-id-type="pmid">24451626</pub-id></citation></ref>
<ref id="B15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Korf</surname> <given-names>I.</given-names></name></person-group> (<year>2004</year>). <article-title>Gene finding in novel genomes.</article-title> <source><italic>BMC Bioinformatics</italic></source> <volume>5</volume>:<issue>59</issue>. <pub-id pub-id-type="doi">10.1186/1471-2105-5-59</pub-id> <pub-id pub-id-type="pmid">15144565</pub-id></citation></ref>
<ref id="B16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Krause</surname> <given-names>K.</given-names></name></person-group> (<year>2008</year>). <article-title>From chloroplasts to &#x201C;cryptic&#x201D; plastids: evolution of plastid genomes in parasitic plants.</article-title> <source><italic>Curr. Genet.</italic></source> <volume>54</volume> <fpage>111</fpage>&#x2013;<lpage>121</lpage>. <pub-id pub-id-type="doi">10.1007/s00294-008-0208-8</pub-id> <pub-id pub-id-type="pmid">18696071</pub-id></citation></ref>
<ref id="B17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kretzschmar</surname> <given-names>T.</given-names></name> <name><surname>Kohlen</surname> <given-names>W.</given-names></name> <name><surname>Sasse</surname> <given-names>J.</given-names></name> <name><surname>Borghi</surname> <given-names>L.</given-names></name> <name><surname>Schlegel</surname> <given-names>M.</given-names></name> <name><surname>Bachelier</surname> <given-names>J. B.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>A petunia ABC protein controls strigolactone-dependent symbiotic signalling and branching.</article-title> <source><italic>Nature</italic></source> <volume>483</volume> <fpage>341</fpage>&#x2013;<lpage>344</lpage>. <pub-id pub-id-type="doi">10.1038/nature10873</pub-id> <pub-id pub-id-type="pmid">22398443</pub-id></citation></ref>
<ref id="B18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lahti</surname> <given-names>D. C.</given-names></name> <name><surname>Johnson</surname> <given-names>N. A.</given-names></name> <name><surname>Ajie</surname> <given-names>B. C.</given-names></name> <name><surname>Otto</surname> <given-names>S. P.</given-names></name> <name><surname>Hendry</surname> <given-names>A. P.</given-names></name> <name><surname>Blumstein</surname> <given-names>D. T.</given-names></name><etal/></person-group> (<year>2009</year>). <article-title>Relaxed selection in the wild.</article-title> <source><italic>Trends Ecol. Evol.</italic></source> <volume>24</volume> <fpage>487</fpage>&#x2013;<lpage>496</lpage>. <pub-id pub-id-type="doi">10.1016/j.tree.2009.03.010</pub-id> <pub-id pub-id-type="pmid">19500875</pub-id></citation></ref>
<ref id="B19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lan</surname> <given-names>J.</given-names></name> <name><surname>Xu</surname> <given-names>J. T.</given-names></name> <name><surname>Li</surname> <given-names>J. S.</given-names></name></person-group> (<year>1994</year>). <article-title>Study on symbiotic relation between Gastrodia elata and Armillariella mellea by autoradiography.</article-title> <source><italic>Mycosystema</italic></source> <volume>13</volume> <fpage>219</fpage>&#x2013;<lpage>222</lpage>.</citation></ref>
<ref id="B20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Langmead</surname> <given-names>B.</given-names></name> <name><surname>Salzberg</surname> <given-names>S. L.</given-names></name></person-group> (<year>2012</year>). <article-title>Fast gapped-read alignment with Bowtie 2.</article-title> <source><italic>Nat. Methods</italic></source> <volume>9</volume> <fpage>357</fpage>&#x2013;<lpage>359</lpage>. <pub-id pub-id-type="doi">10.1038/nmeth.1923</pub-id> <pub-id pub-id-type="pmid">22388286</pub-id></citation></ref>
<ref id="B21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Leake</surname> <given-names>J. R.</given-names></name></person-group> (<year>1994</year>). <article-title>The biology of myco-heterotrophic (&#x2018;saprophytic&#x2019;) plants.</article-title> <source><italic>New Phytol.</italic></source> <volume>127</volume> <fpage>171</fpage>&#x2013;<lpage>216</lpage>. <pub-id pub-id-type="doi">10.1111/j.1469-8137.1994.tb04272.x</pub-id></citation></ref>
<ref id="B22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>L.</given-names></name> <name><surname>Stoeckert</surname> <given-names>C. J.</given-names></name> <name><surname>Roos</surname> <given-names>D. S.</given-names></name></person-group> (<year>2003</year>). <article-title>OrthoMCL: identification of ortholog groups for eukaryotic genomes.</article-title> <source><italic>Genome Res.</italic></source> <volume>13</volume> <fpage>2178</fpage>&#x2013;<lpage>2189</lpage>. <pub-id pub-id-type="doi">10.1101/gr.1224503</pub-id> <pub-id pub-id-type="pmid">12952885</pub-id></citation></ref>
<ref id="B23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liang</surname> <given-names>Y.</given-names></name> <name><surname>Xiao</surname> <given-names>W.</given-names></name> <name><surname>Hui</surname> <given-names>L.</given-names></name> <name><surname>Yang</surname> <given-names>T.</given-names></name> <name><surname>Lian</surname> <given-names>J.</given-names></name> <name><surname>Yang</surname> <given-names>R.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>The genome of dendrobium officinale illuminates the biology of the important traditional chinese orchid herb.</article-title> <source><italic>Mol. Plant</italic></source> <volume>008</volume> <fpage>922</fpage>&#x2013;<lpage>934</lpage>. <pub-id pub-id-type="doi">10.1016/j.molp.2014.12.011</pub-id> <pub-id pub-id-type="pmid">25825286</pub-id></citation></ref>
<ref id="B24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname> <given-names>J.</given-names></name> <name><surname>Jin-tang</surname> <given-names>X.</given-names></name> <name><surname>He</surname> <given-names>W.</given-names></name> <name><surname>Hong-xiang</surname> <given-names>L.</given-names></name> <name><surname>Yong-ru</surname> <given-names>S.</given-names></name></person-group> (<year>1993</year>). <article-title>Detection and immunofiuorescence localization of antifungal protein of gastrodiaelata.</article-title> <source><italic>J. Integr. Plant Biol.</italic></source> <volume>35</volume> <fpage>593</fpage>&#x2013;<lpage>599</lpage>.</citation></ref>
<ref id="B25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lohse</surname> <given-names>M.</given-names></name> <name><surname>Drechsel</surname> <given-names>O.</given-names></name> <name><surname>Kahlau</surname> <given-names>S.</given-names></name> <name><surname>Bock</surname> <given-names>R.</given-names></name></person-group> (<year>2013</year>). <article-title>OrganellarGenomeDRAW&#x2013;a suite of tools for generating physical maps of plastid and mitochondrial genomes and visualizing expression data sets.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>41</volume> <fpage>W575</fpage>&#x2013;<lpage>W581</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkt289</pub-id> <pub-id pub-id-type="pmid">23609545</pub-id></citation></ref>
<ref id="B26"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Majoros</surname> <given-names>W. H.</given-names></name> <name><surname>Pertea</surname> <given-names>M.</given-names></name> <name><surname>Salzberg</surname> <given-names>S. L.</given-names></name></person-group> (<year>2004</year>). <article-title>TigrScan and GlimmerHMM: two open source ab initio eukaryotic gene-finders.</article-title> <source><italic>Bioinformatics</italic></source> <volume>20</volume> <fpage>2878</fpage>&#x2013;<lpage>2879</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/bth315</pub-id> <pub-id pub-id-type="pmid">15145805</pub-id></citation></ref>
<ref id="B27"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Merckx</surname> <given-names>V.</given-names></name> <name><surname>Bidartondo</surname> <given-names>M. I.</given-names></name> <name><surname>Hynson</surname> <given-names>N. A.</given-names></name></person-group> (<year>2009</year>). <article-title>Myco-heterotrophy: when fungi host plants.</article-title> <source><italic>Ann. Bot.</italic></source> <volume>104</volume> <fpage>1255</fpage>&#x2013;<lpage>1261</lpage>. <pub-id pub-id-type="doi">10.1093/aob/mcp235</pub-id> <pub-id pub-id-type="pmid">19767309</pub-id></citation></ref>
<ref id="B28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Merckx</surname> <given-names>V.</given-names></name> <name><surname>Freudenstein</surname> <given-names>J. V.</given-names></name></person-group> (<year>2010</year>). <article-title>Evolution of mycoheterotrophy in plants: a phylogenetic perspective.</article-title> <source><italic>New Phytol.</italic></source> <volume>185</volume> <fpage>605</fpage>&#x2013;<lpage>609</lpage>. <pub-id pub-id-type="doi">10.1111/j.1469-8137.2009.03155.x</pub-id> <pub-id pub-id-type="pmid">20356335</pub-id></citation></ref>
<ref id="B29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ning</surname> <given-names>Z.</given-names></name> <name><surname>Bai</surname> <given-names>X. F.</given-names></name> <name><surname>Jian-Tao</surname> <given-names>L. V.</given-names></name> <name><surname>Yang</surname> <given-names>J. F.</given-names></name> <name><surname>Gui-Ping</surname> <given-names>X. U.</given-names></name></person-group> (<year>2010</year>). <article-title>Study on symbiotic mechanism between gastrodia elata blume and armillaria mellea in tissue culture system.</article-title> <source><italic>Med. Plant</italic></source> <volume>34</volume> <fpage>95</fpage>&#x2013;<lpage>96</lpage>.</citation></ref>
<ref id="B30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Palmer</surname> <given-names>J. D.</given-names></name> <name><surname>Thompson</surname> <given-names>W. F.</given-names></name></person-group> (<year>1982</year>). <article-title>Chloroplast DNA rearrangements are more frequent when a large inverted repeat sequence is lost.</article-title> <source><italic>Cell</italic></source> <volume>29</volume> <fpage>537</fpage>&#x2013;<lpage>550</lpage>. <pub-id pub-id-type="doi">10.1016/0092-8674(82)90170-2</pub-id></citation></ref>
<ref id="B31"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Read</surname> <given-names>D. J.</given-names></name></person-group> (<year>1991</year>). <article-title>Mycorrhizas in ecosystems.</article-title> <source><italic>Cell. Mol. Life Sci.</italic></source> <volume>47</volume> <fpage>376</fpage>&#x2013;<lpage>391</lpage>. <pub-id pub-id-type="doi">10.1007/BF01972080</pub-id></citation></ref>
<ref id="B32"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sa</surname> <given-names>Q.</given-names></name> <name><surname>Wang</surname> <given-names>Y.</given-names></name> <name><surname>Li</surname> <given-names>W.</given-names></name> <name><surname>Zhang</surname> <given-names>L.</given-names></name> <name><surname>Sun</surname> <given-names>Y.</given-names></name></person-group> (<year>2003</year>). <article-title>The promoter of an antifungal protein gene from <italic>Gastrodia elata</italic> confers tissue -specific and fungus-inducible expression patterns and responds to both salicylic acid and jasmonic acid.</article-title> <source><italic>Plant Cell Rep.</italic></source> <volume>22</volume> <fpage>79</fpage>&#x2013;<lpage>84</lpage>. <pub-id pub-id-type="doi">10.1007/s00299-003-0664-z</pub-id> <pub-id pub-id-type="pmid">12838365</pub-id></citation></ref>
<ref id="B33"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sandelius</surname> <given-names>A. S.</given-names></name> <name><surname>Aronsson</surname> <given-names>H.</given-names></name></person-group> (<year>2009</year>). &#x201C;<article-title>The chloroplast: interactions with the environment</article-title>,&#x201D; in <source><italic>Plant Cell Monographs</italic></source>, <role>ed.</role> <person-group person-group-type="editor"><name><surname>Nick</surname> <given-names>P.</given-names></name></person-group> (<publisher-loc>Cham</publisher-loc>: <publisher-name>Springer</publisher-name>).</citation></ref>
<ref id="B34"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Stanke</surname> <given-names>M.</given-names></name> <name><surname>Keller</surname> <given-names>O.</given-names></name> <name><surname>Gunduz</surname> <given-names>I.</given-names></name> <name><surname>Hayes</surname> <given-names>A.</given-names></name> <name><surname>Waack</surname> <given-names>S.</given-names></name> <name><surname>Morgenstern</surname> <given-names>B.</given-names></name></person-group> (<year>2006</year>). <article-title>AUGUSTUS: Ab initio prediction of alternative transcripts.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>34</volume> <fpage>W435</fpage>&#x2013;<lpage>W439</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkl200</pub-id> <pub-id pub-id-type="pmid">16845043</pub-id></citation></ref>
<ref id="B35"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Trapnell</surname> <given-names>C.</given-names></name> <name><surname>Pachter</surname> <given-names>L.</given-names></name> <name><surname>Salzberg</surname> <given-names>S. L.</given-names></name></person-group> (<year>2009</year>). <article-title>TopHat: discovering splice junctions with RNA-Seq.</article-title> <source><italic>Bioinformatics</italic></source> <volume>25</volume> <fpage>1105</fpage>&#x2013;<lpage>1111</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btp120</pub-id> <pub-id pub-id-type="pmid">19289445</pub-id></citation></ref>
<ref id="B36"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>X.</given-names></name> <name><surname>Bauw</surname> <given-names>G.</given-names></name> <name><surname>Van Damme</surname> <given-names>E. J.</given-names></name> <name><surname>Peumans</surname> <given-names>W. J.</given-names></name> <name><surname>Chen</surname> <given-names>Z. L.</given-names></name> <name><surname>Van Montagu</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2001</year>). <article-title>Gastrodianin-like mannose-binding proteins: a novel class of plant proteins with antifungal properties.</article-title> <source><italic>Plant J.</italic></source> <volume>25</volume> <fpage>651</fpage>&#x2013;<lpage>661</lpage>. <pub-id pub-id-type="doi">10.1046/j.1365-313x.2001.00999.x</pub-id> <pub-id pub-id-type="pmid">11319032</pub-id></citation></ref>
<ref id="B37"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Waterhouse</surname> <given-names>R. M.</given-names></name> <name><surname>Seppey</surname> <given-names>M.</given-names></name> <name><surname>Sim&#x00E3;o</surname> <given-names>F. A.</given-names></name> <name><surname>Manni</surname> <given-names>M.</given-names></name> <name><surname>Ioannidis</surname> <given-names>P.</given-names></name> <name><surname>Klioutchnikov</surname> <given-names>G.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>BUSCO applications from quality assessments to gene prediction and phylogenomics.</article-title> <source><italic>Mol. Biol. Evol.</italic></source> <volume>35</volume> <fpage>543</fpage>&#x2013;<lpage>548</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msx319</pub-id> <pub-id pub-id-type="pmid">29220515</pub-id></citation></ref>
<ref id="B38"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wicke</surname> <given-names>S.</given-names></name> <name><surname>Muller</surname> <given-names>K. F.</given-names></name> <name><surname>De Pamphilis</surname> <given-names>C. W.</given-names></name> <name><surname>Quandt</surname> <given-names>D.</given-names></name> <name><surname>Wickett</surname> <given-names>N. J.</given-names></name> <name><surname>Zhang</surname> <given-names>Y.</given-names></name><etal/></person-group> (<year>2013</year>). <article-title>Mechanisms of functional and physical genome reduction in photosynthetic and nonphotosynthetic parasitic plants of the broomrape family.</article-title> <source><italic>Plant Cell</italic></source> <volume>25</volume> <fpage>3711</fpage>&#x2013;<lpage>3725</lpage>. <pub-id pub-id-type="doi">10.1105/tpc.113.113373</pub-id> <pub-id pub-id-type="pmid">24143802</pub-id></citation></ref>
<ref id="B39"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wicke</surname> <given-names>S.</given-names></name> <name><surname>Schaferhoff</surname> <given-names>B.</given-names></name> <name><surname>DePamphilis</surname> <given-names>C. W.</given-names></name> <name><surname>Muller</surname> <given-names>K. F.</given-names></name></person-group> (<year>2014</year>). <article-title>Disproportional plastome-wide increase of substitution rates and relaxed purifying selection in genes of carnivorous Lentibulariaceae.</article-title> <source><italic>Mol. Biol. Evol.</italic></source> <volume>31</volume> <fpage>529</fpage>&#x2013;<lpage>545</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/mst261</pub-id> <pub-id pub-id-type="pmid">24344209</pub-id></citation></ref>
<ref id="B40"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wyman</surname> <given-names>S. K.</given-names></name> <name><surname>Jansen</surname> <given-names>R. K.</given-names></name> <name><surname>Boore</surname> <given-names>J. L.</given-names></name></person-group> (<year>2004</year>). <article-title>Automatic annotation of organellar genomes with DOGMA.</article-title> <source><italic>Bioinformatics</italic></source> <volume>20</volume> <fpage>3252</fpage>&#x2013;<lpage>3255</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/bth352</pub-id> <pub-id pub-id-type="pmid">15180927</pub-id></citation></ref>
<ref id="B41"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yan</surname> <given-names>L.</given-names></name> <name><surname>Wang</surname> <given-names>X.</given-names></name> <name><surname>Liu</surname> <given-names>H.</given-names></name> <name><surname>Tian</surname> <given-names>Y.</given-names></name> <name><surname>Lian</surname> <given-names>J.</given-names></name> <name><surname>Yang</surname> <given-names>R.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>The genome of dendrobium officinale illuminates the biology of the important traditional chinese orchid herb.</article-title> <source><italic>Mol. Plant</italic></source> <volume>8</volume> <fpage>922</fpage>&#x2013;<lpage>934</lpage>. <pub-id pub-id-type="doi">10.1016/j.molp.2014.12.011</pub-id> <pub-id pub-id-type="pmid">25825286</pub-id></citation></ref>
<ref id="B42"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname> <given-names>P.</given-names></name> <name><surname>Zhou</surname> <given-names>H.</given-names></name> <name><surname>Qian</surname> <given-names>J.</given-names></name> <name><surname>Xu</surname> <given-names>H.</given-names></name> <name><surname>Shao</surname> <given-names>Q.</given-names></name> <name><surname>Li</surname> <given-names>Y.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>The complete chloroplast genome sequence of <italic>Dendrobium officinale</italic>.</article-title> <source><italic>Mitochondrial DNA DNA Mapp. Seq. Anal.</italic></source> <volume>27</volume> <fpage>1262</fpage>&#x2013;<lpage>1264</lpage>. <pub-id pub-id-type="doi">10.3109/19401736.2014.945547</pub-id> <pub-id pub-id-type="pmid">25103425</pub-id></citation></ref>
<ref id="B43"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname> <given-names>Z.</given-names></name></person-group> (<year>2007</year>). <article-title>PAML 4: phylogenetic analysis by maximum likelihood.</article-title> <source><italic>Mol. Biol. Evol.</italic></source> <volume>24</volume> <fpage>1586</fpage>&#x2013;<lpage>1591</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msm088</pub-id> <pub-id pub-id-type="pmid">17483113</pub-id></citation></ref>
<ref id="B44"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yuan</surname> <given-names>Y.</given-names></name> <name><surname>Jin</surname> <given-names>X.</given-names></name> <name><surname>Liu</surname> <given-names>J.</given-names></name> <name><surname>Zhao</surname> <given-names>X.</given-names></name> <name><surname>Zhou</surname> <given-names>J.</given-names></name> <name><surname>Wang</surname> <given-names>X.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>The Gastrodia elata genome provides insights into plant adaptation to heterotrophy.</article-title> <source><italic>Nat. Commun.</italic></source> <volume>9</volume>:<issue>1615</issue>. <pub-id pub-id-type="doi">10.1038/s41467-018-03423-5</pub-id> <pub-id pub-id-type="pmid">29691383</pub-id></citation></ref>
<ref id="B45"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>G. Q.</given-names></name> <name><surname>Liu</surname> <given-names>K. W.</given-names></name> <name><surname>Li</surname> <given-names>Z.</given-names></name> <name><surname>Lohaus</surname> <given-names>R.</given-names></name> <name><surname>Hsiao</surname> <given-names>Y. Y.</given-names></name> <name><surname>Niu</surname> <given-names>S. C.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>The Apostasia genome and the evolution of orchids.</article-title> <source><italic>Nature</italic></source> <volume>549</volume> <fpage>379</fpage>&#x2013;<lpage>383</lpage>. <pub-id pub-id-type="doi">10.1038/nature23897</pub-id> <pub-id pub-id-type="pmid">28902843</pub-id></citation></ref>
<ref id="B46"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>W. J.</given-names></name></person-group> (<year>1980</year>). <article-title>The biological relationship of gastrodia elata and armillaria mellea.</article-title> <source><italic>Bull. Bot.</italic></source> <volume>22</volume> <fpage>57</fpage>&#x2013;<lpage>62</lpage>.</citation></ref>
</ref-list>
<fn-group>
<fn id="footnote1">
<label>1</label>
<p><ext-link ext-link-type="uri" xlink:href="http://sourceforge.net/projects/soapdenovo2/files/GapCloser/">http://sourceforge.net/projects/soapdenovo2/files/GapCloser/</ext-link></p></fn>
<fn id="footnote2">
<label>2</label>
<p><ext-link ext-link-type="uri" xlink:href="https://sourceforge.net/projects/bowtie-bio/files/bowtie2/2.3.4.3">https://sourceforge.net/projects/bowtie-bio/files/bowtie2/2.3.4.3</ext-link></p></fn>
<fn id="footnote3">
<label>3</label>
<p><ext-link ext-link-type="uri" xlink:href="http://ccb.jhu.edu/software/tophat/index.shtml">http://ccb.jhu.edu/software/tophat/index.shtml</ext-link></p></fn>
<fn id="footnote4">
<label>4</label>
<p><ext-link ext-link-type="uri" xlink:href="https://github.com/trinityrnaseq/trinityrnaseq/releases">https://github.com/trinityrnaseq/trinityrnaseq/releases</ext-link></p></fn>
<fn id="footnote5">
<label>5</label>
<p><ext-link ext-link-type="uri" xlink:href="http://cole-trapnell-lab.github.io/cufflinks/cuffdiff/index.html">http://cole-trapnell-lab.github.io/cufflinks/cuffdiff/index.html</ext-link></p></fn>
<fn id="footnote6">
<label>6</label>
<p><ext-link ext-link-type="uri" xlink:href="ftp://ftp.ebi.ac.uk/pub/software/unix/iprscan/5/5.32-71.0/interproscan-5.32-71.0-64-bit.tar.gz">ftp://ftp.ebi.ac.uk/pub/software/unix/iprscan/5/5.32-71.0/interproscan-5.32-71.0-64-bit.tar.gz</ext-link></p></fn>
<fn id="footnote7">
<label>7</label>
<p><ext-link ext-link-type="uri" xlink:href="http://www.drive5.com/muscle/downloads.htm">http://www.drive5.com/muscle/downloads.htm</ext-link></p></fn>
<fn id="footnote8">
<label>8</label>
<p><ext-link ext-link-type="uri" xlink:href="http://nbisweden.github.io/MrBayes/download.html">http://nbisweden.github.io/MrBayes/download.html</ext-link></p></fn>
<fn id="footnote9">
<label>9</label>
<p><ext-link ext-link-type="uri" xlink:href="http://evomics.org/resources/software/molecular-evolution-software/paml/">http://evomics.org/resources/software/molecular-evolution-software/paml/</ext-link></p></fn>
<fn id="footnote10">
<label>10</label>
<p><ext-link ext-link-type="uri" xlink:href="http://dogma.ccbb.utexas.edu">http://dogma.ccbb.utexas.edu</ext-link></p></fn>
<fn id="footnote11">
<label>11</label>
<p><ext-link ext-link-type="uri" xlink:href="https://chlorobox.mpimp-golm.mpg.de/OGDraw-Downloads.html">https://chlorobox.mpimp-golm.mpg.de/OGDraw-Downloads.html</ext-link></p></fn>
</fn-group>
</back>
</article>