<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Plant Sci.</journal-id>
<journal-title>Frontiers in Plant Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Plant Sci.</abbrev-journal-title>
<issn pub-type="epub">1664-462X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpls.2022.947164</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Plant Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Reference quality genome sequence of Indian pomegranate cv. &#x2018;Bhagawa&#x2019; (<italic>Punica granatum</italic> L.)</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name><surname>Roopa Sowjanya</surname> <given-names>P.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c005"><sup>&#x002A;</sup></xref>
<xref ref-type="author-notes" rid="fn002"><sup>&#x2020;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1325486/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Shilpa</surname> <given-names>Parashuram</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn002"><sup>&#x2020;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/687472/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Patil</surname> <given-names>Goudappa Prakash</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c003"><sup>&#x002A;</sup></xref>
<xref ref-type="author-notes" rid="fn002"><sup>&#x2020;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1086851/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Babu</surname> <given-names>Dhinesh Karuppannan</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1246881/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Sharma</surname> <given-names>Jyotsana</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1246908/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Sangnure</surname> <given-names>Vipul R.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Mundewadikar</surname> <given-names>Dhananjay M.</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1246381/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Natarajan</surname> <given-names>Purushothaman</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="corresp" rid="c004"><sup>&#x002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1327229/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Marathe</surname> <given-names>Arvind Rajiv</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn002"><sup>&#x2020;</sup></xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Reddy</surname> <given-names>Umesh K.</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="corresp" rid="c002"><sup>&#x002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/367393/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Singh</surname> <given-names>Vikram Nripendra</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<xref ref-type="author-notes" rid="fn002"><sup>&#x2020;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/502249/overview"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>ICAR-National Research Centre on Pomegranate (NRCP)</institution>, <addr-line>Solapur</addr-line>, <country>India</country></aff>
<aff id="aff2"><sup>2</sup><institution>CSIR-National Chemical Laboratory</institution>, <addr-line>Pune</addr-line>, <country>India</country></aff>
<aff id="aff3"><sup>3</sup><institution>Gus R. Douglass Institute and Department of Biology, West Virginia State University</institution>, <addr-line>Institute, WV</addr-line>, <country>United States</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Giuseppe Ferrara, University of Bari Aldo Moro, Italy</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Jiyu Li, Institute of Horticulture Research, China; Nimisha Sharma, Indian Agricultural Research Institute (ICAR), India</p></fn>
<corresp id="c001">&#x002A;Correspondence: Nripendra Vikram Singh, <email>nripendras72@gmail.com</email></corresp>
<corresp id="c002">Umesh K. Reddy, <email>ureddy@wvstateu.edu</email></corresp>
<corresp id="c003">Prakash Goudappa Patil, <email>patilbt@gmail.com</email></corresp>
<corresp id="c004">Purushothaman Natarajan, <email>pnatarajan@wvstateu.edu</email></corresp>
<corresp id="c005">P. Roopa Sowjanya, <email>2010rupasowjanya@gmail.com</email></corresp>
<fn fn-type="equal" id="fn002"><p><sup>&#x2020;</sup>These authors have contributed equally to this work</p></fn>
<fn fn-type="other" id="fn004"><p>This article was submitted to Plant Breeding, a section of the journal Frontiers in Plant Science</p></fn>
</author-notes>
<pub-date pub-type="epub">
<day>15</day>
<month>09</month>
<year>2022</year>
</pub-date>
<pub-date pub-type="collection">
<year>2022</year>
</pub-date>
<volume>13</volume>
<elocation-id>947164</elocation-id>
<history>
<date date-type="received">
<day>18</day>
<month>05</month>
<year>2022</year>
</date>
<date date-type="accepted">
<day>07</day>
<month>07</month>
<year>2022</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2022 Roopa Sowjanya, Shilpa, Patil, Babu, Sharma, Sangnure, Mundewadikar, Natarajan, Marathe, Reddy and Singh.</copyright-statement>
<copyright-year>2022</copyright-year>
<copyright-holder>Roopa Sowjanya, Shilpa, Patil, Babu, Sharma, Sangnure, Mundewadikar, Natarajan, Marathe, Reddy and Singh</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<p>Pomegranate is an important fruit crop for ensuring livelihood and nutrition security in fragile semi-arid regions of the globe having limited irrigation resources. This is a high-value, nutritionally rich, and export-oriented agri-commodity that ensures high returns on investment to growers across the world. Although it is a valuable fruit crop, it has received only a limited genomics research outcome. To fast-track the pomegranate improvement program, <italic>de novo</italic> whole-genome sequencing of the main Indian cultivar &#x2018;Bhagawa&#x2019; was initiated by the Indian Council of Agricultural Research&#x2013;National Research Center on Pomegranate (ICAR&#x2013;NRCP). We have demonstrated that a combination of commercially available technologies from Illumina, PacBio, 10X Genomics, and BioNano Genomics could be used efficiently for sequencing and reference-grade <italic>de novo</italic> assembly of the pomegranate genome. The research led to a final reference-quality genome assembly for &#x2018;Bhagawa&#x2019; of 346.08 Mb in 342 scaffolds and an average N50 of 16.12 Mb and N90 of 1088.62 Kb. This assembly covered more than 98% of the estimated pomegranate genome size, 352.54 Mb. The LTR assembly index (LAI) value of 10 and 93.68% Benchmarking Universal Single-Copy Orthologs (BUSCO) completeness score over the 1,440 ortholog genes of the completed pomegranate genome indicates the quality of the assembled pomegranate genome. Furthermore, 29,435 gene models were discovered with a mean transcript length of 2,954 bp and a mean coding sequence length 1,090 bp. Four transcript data samples of pomegranate tissues were mapped over the assembled &#x2018;Bhagawa&#x2019; genome up to 95% significant matches, indicating the high quality of the assembled genome. We have compared the &#x2018;Bhagawa&#x2019; genome with the genomes of the pomegranate cultivars &#x2018;Dabenzi&#x2019; and &#x2018;Taishanhong.&#x2019; We have also performed whole-genome phylogenetic analysis using Computational Analysis of Gene Family Evolution (CAFE) and found that <italic>Eucalyptus grandis</italic> and pomegranate diverged 64 (60&#x2013;70) million years ago. About 1,573 protein-coding resistance genes identified in the &#x2018;Bhagawa&#x2019; genome were classified into 32 domains. In all, 314 copies of miRNA belonging to 26 different families were identified in the &#x2018;Bhagawa&#x2019; genome. The reference-quality genome assembly of &#x2018;Bhagawa&#x2019; is certainly a significant genomic resource for accelerated pomegranate improvement.</p>
</abstract>
<kwd-group>
<kwd>pomegranate</kwd>
<kwd>PacBio</kwd>
<kwd>Long Terminal Repeats Assembly Index (LAI)</kwd>
<kwd>genome sequencing</kwd>
<kwd>hybrid genome assembly</kwd>
</kwd-group>
<contract-sponsor id="cn001">Indian Council of Agricultural Research<named-content content-type="fundref-id">10.13039/501100001503</named-content></contract-sponsor>
<counts>
<fig-count count="8"/>
<table-count count="7"/>
<equation-count count="0"/>
<ref-count count="65"/>
<page-count count="17"/>
<word-count count="9207"/>
</counts>
</article-meta>
</front>
<body>
<sec id="S1" sec-type="intro">
<title>Introduction</title>
<p>Pomegranate (<italic>Punica granatum</italic> L.), a diploid fruit crop species (2n = 16), is a member of the lythraceae family (<xref ref-type="bibr" rid="B17">Graham and Graham, 2014</xref>; <xref ref-type="bibr" rid="B5">Berger et al., 2016</xref>). The <italic>Punica</italic> genus has two species: <italic>P. granatum</italic> and <italic>P. protopunica</italic>. All cultivated-type pomegranates belong to <italic>P. granatum</italic>. <italic>P. protopunica</italic> is considered an ancestor of cultivated pomegranates and has contributed to the evolutionary process. However, <italic>P. protopunica</italic> is endemic to the Socotra Islands (Yemen) and is not available in most of the major pomegranate-growing countries of the world. To trace the evolutionary history of cultivated pomegranate, two wild pomegranate types, <italic>Daru</italic> and <italic>P. granatum</italic> var. Nana, were used (<xref ref-type="bibr" rid="B34">Moriguchi et al., 1987</xref>; <xref ref-type="bibr" rid="B18">Guarino et al., 1990</xref>; <xref ref-type="bibr" rid="B32">Mars, 2000</xref>; <xref ref-type="bibr" rid="B30">Levin, 2006</xref>; <xref ref-type="bibr" rid="B10">da Silva et al., 2013</xref>; <xref ref-type="bibr" rid="B15">Ferrara et al., 2021</xref>).</p>
<p>Pomegranate is globally grown on approximately 0.55 million ha with a production of about 6.5 million tonnes, and it is considered an important fruit crop in semi-arid tropical areas (<xref ref-type="bibr" rid="B15">Ferrara et al., 2021</xref>). It is an economically important fruit crop with high nutraceutical value. Pomegranate has approximately 11.33 mmol of antioxidants, such as punicalagin and other ellagitannin-based compounds per 100 g of fruit. These antioxidants have medicinal properties for heart disease and prostate cancer (<xref ref-type="bibr" rid="B19">Halvorsen et al., 2002</xref>; <xref ref-type="bibr" rid="B20">Holland et al., 2009</xref>; <xref ref-type="bibr" rid="B22">Johanningsmeier and Harris, 2011</xref>).</p>
<p>Pomegranate cultivation started in 3000 BC in Central Asia (<xref ref-type="bibr" rid="B8">Chandra et al., 2010</xref>). The pomegranate crop has versatile adaptability because of its hardy nature and low water requirements across the Mediterranean, tropical and subtropical regions of Iran, India, China, Turkey, Spain, Tunisia, Morocco, and Afghanistan. Globally, India is the largest producer of pomegranate, with 2.8 million tonnes of annual production contributing about 40% of the global share, followed by China (1.6 million tonnes), Iran (0.7 million tonnes), and Turkey (0.5 million tonnes) (<xref ref-type="bibr" rid="B15">Ferrara et al., 2021</xref>). Pomegranate is considered a strategic crop for ensuring nutritional and livelihood security in water-scarce regions of the world, hence, to some extent, it can help to mitigate global warming.</p>
<p>Due to of the alluring monetary return per unit area from this crop and increased demand for table and processed products with high export potential, pomegranate cultivation has experienced a tremendous increase in area, production, and export from India during the last 2 decades. In India, the pomegranate acreage is 0.275 million ha, with an annual production of 3.256 million tonnes. It is extensively grown in Maharashtra, Gujarat, Karnataka, Andhra Pradesh, and Telangana states and is quickly being established in Himachal Pradesh, Rajasthan, and Madhya Pradesh. Small areas of pomegranate are under cultivation in Tamil Nadu, Punjab, Haryana, Jharkhand, and Jammu and Kashmir (2019-20<sup><xref ref-type="fn" rid="footnote1">1</xref></sup>). Export of pomegranate has increased from 18.21 thousand MT (Rs. 710 million) in 2010&#x2013;2011 to about 99.04 thousand MT (Rs.6888 million) in 2021&#x2013;2022<sup><xref ref-type="fn" rid="footnote2">2</xref></sup>.</p>
<p>Although the area under pomegranate cultivation is increasing because it is grown in low-input and risk-prone marginal environments, there is a large gap between the expected yield potential (average productivity of some of the major pomegranate-producing countries is about 20 tonnes/ha) and the realized yield potential on farmers&#x2019; fields (&#x223C;12 tonnes/ha) in India. This situation could be due to various biotic and abiotic stresses affecting the crop. Therefore, to accelerate the application of genomics to improve the yield and quality of pomegranate, we assembled the genome sequence of the Indian pomegranate cultivar &#x2018;Bhagawa&#x2019; and performed further analysis. The Indian pomegranate industry is ruled by a single cultivar, &#x2018;Bhagawa,&#x2019; having excellent exportable fruit qualities with high export demand. It is also preferred for domestic consumption. However, this variety is highly susceptible to major diseases and pests, such as bacterial blight, <italic>Ceratocystis</italic> wilt, fruit sucking moths, etc., that are significantly reducing the yield potential of this variety. Therefore, we selected &#x2018;Bhagawa&#x2019; for assembling a quality genome to decode important genes for resistance/susceptibility, which can be later targeted for genome-editing applications to improve this variety.</p>
<p>Despite the availability of the draft genome sequences of cv. &#x2018;Taishanhong&#x2019; and &#x2018;Dabenzi&#x2019; pomegranate of China and transcriptome assemblies, deeper knowledge of the genetic basis of yield, quality, and stress tolerance for genetic improvement is lacking in pomegranate (<xref ref-type="bibr" rid="B38">Ono et al., 2011</xref>; <xref ref-type="bibr" rid="B39">Ophir et al., 2014</xref>; <xref ref-type="bibr" rid="B46">Saminathan et al., 2016</xref>; <xref ref-type="bibr" rid="B44">Qin et al., 2017</xref>; <xref ref-type="bibr" rid="B64">Yuan Z. et al., 2018</xref>). Also, the unavailability of a high-quality reference genome limits molecular studies in pomegranate. Therefore, in the present study, we aimed to assemble the high-quality genome of cv. &#x2018;Bhagawa&#x2019; by using third- and fourth-generation sequencing technologies to capture the entire genome with high continuity. We also compared the assembly quality of our genome with available draft genomes of pomegranate. The availability of the complete genome sequence will accelerate the use of pomegranate genepool resources in molecular breeding. Also, we developed genome-wide simple sequence repeat (SSR) markers for gene discovery and molecular breeding applications. The genomic resources from the current study will benefit the pomegranate research community in discovering the trait-specific genes. It will also increase the efficiency of pomegranate improvement by integrating novel biotechnological tools, such as genome editing and genomics-assisted selection, to complement conventional breeding programs of pomegranate variety improvement with resistance to biotic and abiotic stresses.</p>
</sec>
<sec id="S2" sec-type="results">
<title>Results</title>
<sec id="S2.SS1">
<title>Genome sequencing and <italic>de novo</italic> genome assembly</title>
<p>The study aimed to generate the high-quality reference-level genome of the Indian pomegranate cultivar &#x2018;Bhagawa.&#x2019; To achieve this, we opted for short- to long-read sequencing with second- to fourth-generation technologies, such as Illumina, 10X genomics, PacBio, and BioNano Optical mapping. Hence, we could generate enormous genomic data for each technology (<xref ref-type="table" rid="T1">Table 1</xref>). Using the direct-label and stain (DLS) technology of the Bionano platform, we generated data of 1191.68 Gb covering 340.4 Mb of the genome (&#x223C;352.54 Mb of an estimated genome) followed by the use of the HiSeqX platform generating data of 77.08 Gb covering 220 Mb of the genome. The sequence information generated from all these technologies could lead to hybrid scaffolding and the development of a reference-quality genome for &#x2018;Bhagawa.&#x2019; The detailed methodology with steps followed to complete the genome is depicted in <xref ref-type="fig" rid="F1">Figure 1</xref>.</p>
<table-wrap position="float" id="T1">
<label>TABLE 1</label>
<caption><p>Summary of data generated by using genome sequencing platforms for <italic>Punica granatum</italic> cv. &#x2018;Bhagawa&#x2019;.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left">DNA preparation protocols</td>
<td valign="top" align="left">Sequencing/capturing platform</td>
<td valign="top" align="left">Data generated (Gb)</td>
<td valign="top" align="left">Genome coverage &#x223C; 350 Mb</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Paired End</td>
<td valign="top" align="left">Illumina HiSeq 2500</td>
<td valign="top" align="left">75.46</td>
<td valign="top" align="left">215.6</td>
</tr>
<tr>
<td valign="top" align="left">10X Chromium</td>
<td valign="top" align="left">HiSeq X</td>
<td valign="top" align="left">77.08</td>
<td valign="top" align="left">220</td>
</tr>
<tr>
<td valign="top" align="left">SMRT-Bell</td>
<td valign="top" align="left">PacBio Sequel</td>
<td valign="top" align="left">31.42</td>
<td valign="top" align="left">89.74</td>
</tr>
<tr>
<td valign="top" align="left">DLS</td>
<td valign="top" align="left">BioNanoSaphyr</td>
<td valign="top" align="left">1191.68</td>
<td valign="top" align="left">340.4</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn><p>Direct-label and stain &#x2014; DLS.</p></fn>
</table-wrap-foot>
</table-wrap>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption><p>Flow diagram of the strategy used for assembling the genome of pomegranate cv. &#x2018;Bhagawa&#x2019;.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-13-947164-g001.tif"/>
</fig>
<p>From the results of preliminary k-mer genome survey analysis for cv. &#x2018;Bhagawa&#x2019; using 10X Chromium datasets, the final genome size was estimated at 352,535,926 bp (352.54 Mb, <italic>k</italic> = 31). The heterozygosity rate was 0.14% and the repeat ratio was 4.17%, with 65.3% unique sequences and 0.72% error rate, as depicted in <xref ref-type="fig" rid="F2">Figure 2</xref>.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption><p>Genome scope profile showing the genome size and heterozygosity rate as estimated by using k-mers from the &#x2018;Bhagawa&#x2019; genome.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-13-947164-g002.tif"/>
</fig>
<p>We assembled the genome by using datasets generated from different sequencing platforms and an array of assembling software shown in <xref ref-type="table" rid="T2">Table 2</xref>. Results of five approaches combining different sequencing technologies and assembly software were compared. Among the five approaches, the Bio-nano genomics (BNG) and BNG-assisted Super Scaffolds coupled with BioNano Access assembly software yielded higher genome coverage (343.27&#x2013;353.59 Mb) with limited sequences, 78&#x2013;374, and a higher average N50 of 16.11&#x2013;16.31 Mb for the scaffolds. Thus, BNG coupled with BioNano Access was the best to obtain high-quality assembly of genomes with higher contiguity than 10X and PacBio contigs coupled with Super Nova, Falcon-unzip, and Scaff10x assembly (<xref ref-type="table" rid="T2">Table 2</xref>). Furthermore, we polished the genome assembly to obtain the final assembly by using PBJelly2 and Pilon. The final reference-quality genome was 346.08 Mb with only 342 scaffolds and an average N50 of 16.12 Mb and N90 of 1088.62 Kb (<xref ref-type="table" rid="T2">Table 2</xref>). This assembly covered 98% of the estimated size of the pomegranate genome, 352.54 Mb.</p>
<table-wrap position="float" id="T2">
<label>TABLE 2</label>
<caption><p>Statistics at each step of the pomegranate genome assembly.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left">Technology &#x0026; assembly</td>
<td valign="top" align="left">Software</td>
<td valign="top" align="left">Length (Mbp)</td>
<td valign="top" align="left">No. of sequence/no. of scaffold</td>
<td valign="top" align="left">Contig/scaffold N50 (Mbp)</td>
<td valign="top" align="left">Contig/scaffold N90(Kbp)</td>
<td valign="top" align="left">Longest contig/scaffold (Mbp)</td>
<td valign="top" align="left">Median contig/scaffold (Kbp)</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">10X Scaffolds</td>
<td valign="top" align="left">SuperNova</td>
<td valign="top" align="left">331.1</td>
<td valign="top" align="left">12063</td>
<td valign="top" align="left">1.31</td>
<td valign="top" align="left">9.6</td>
<td valign="top" align="left">7.16</td>
<td valign="top" align="left">3.6</td>
</tr>
<tr>
<td valign="top" align="left">PacBio Contigs</td>
<td valign="top" align="left">Falcon-unzip</td>
<td valign="top" align="left">337.12</td>
<td valign="top" align="left">446</td>
<td valign="top" align="left">6.8</td>
<td valign="top" align="left">487.9</td>
<td valign="top" align="left">18.95</td>
<td valign="top" align="left">77.27</td>
</tr>
<tr>
<td valign="top" align="left">PacBio contigs + 10X reads (hybrid scaffolds)</td>
<td valign="top" align="left">Scaff10x</td>
<td valign="top" align="left">337.72</td>
<td valign="top" align="left">432</td>
<td valign="top" align="left">9.88</td>
<td valign="top" align="left">508.06</td>
<td valign="top" align="left">18.95</td>
<td valign="top" align="left">73.46</td>
</tr>
<tr>
<td valign="top" align="left">BNG-assisted SuperScaffolds</td>
<td valign="top" align="left">BioNano Access (All Scaffolds)</td>
<td valign="top" align="left">343.27</td>
<td valign="top" align="left">374</td>
<td valign="top" align="left">16.11</td>
<td valign="top" align="left">1059.69</td>
<td valign="top" align="left">22.45</td>
<td valign="top" align="left">54.17</td>
</tr>
<tr>
<td valign="top" align="left">PBJelly2 and Pilon polished genome</td>
<td valign="top" align="left">PBJelly2 and Pilon</td>
<td valign="top" align="left">346.08</td>
<td valign="top" align="left">342</td>
<td valign="top" align="left">16.12</td>
<td valign="top" align="left">1088.62</td>
<td valign="top" align="left">22.45</td>
<td valign="top" align="left">65.89</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>We assessed the genome quality by using the LTR Assembly Index (LAI) based on LTR retrotransposons that account for the largest genome component in most plant genomes. Our genome had an LAI index of 10, indicating a reference-quality genome as per the LAI index scale of &#x2264; 10 to 20 for reference-quality genomes (<xref ref-type="bibr" rid="B40">Ou et al., 2018</xref>). Finally, the qualities of different assemblies were assessed by using BUSCO. The complete genomic landscape of the &#x2018;Bhagawa&#x2019; genome is presented in <xref ref-type="fig" rid="F3">Figure 3</xref>.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption><p>The genomic landscape of Indian pomegranate cv. &#x2018;Bhagawa.&#x2019; Shows the distribution of the scaffold length, guanine and cytosine GC content, repeat content, gene density, and interactions of scaffolds, with densities calculated in 100-kb window size. The tracks from outside to inside are (1) circular representations of scaffolds 1-342, (2) distribution of Guanine and Cytosine (GC) content in scaffolds, (3) distribution of repeat content, (4) distribution of gene density in scaffolds, and (5) synteny blocks from linked regions of scaffolds.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-13-947164-g003.tif"/>
</fig>
<p>To judge our genome&#x2019;s quality, we compared the assembly statistics of the &#x2018;Bhagawa&#x2019; genome with the other two draft genomes for pomegranates cv. &#x2018;Taishanhong&#x2019; and &#x2018;Dabenzi.&#x2019; According to the assembly parameters listed, our genome qualifies for all parameters with high standards as compared with the previous genomes (<xref ref-type="table" rid="T3">Table 3</xref>). For instance, our final assembly covered 346.08 Mb (98% of estimated genome size) in 342 scaffolds with an N50 of 16.12 Mb and a contig N50 of 6.8 Mb with high GC content (41.01%) <bold>(NCBI database Bio project: <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="PRJNA562100">PRJNA562100</ext-link>, <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="PRJNA505392">PRJNA505392</ext-link>, <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="PRJNA505397">PRJNA505397</ext-link>, <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="PRJNA505398">PRJNA505398</ext-link>, <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="PRJNA505582">PRJNA505582</ext-link>, and <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="PRJNA445950">PRJNA445950</ext-link>)</bold>. A total of 29,435 gene models were discovered, with a mean transcript length of 2,954 bp and a mean coding sequence length 1,090 bp as compared with the previous draft genomes (<xref ref-type="supplementary-material" rid="DS1">Supplementary File 1</xref>). The LAI index that was calculated for all three genomes was 10 for &#x2018;Bhagawa,&#x2019; 8 for &#x2018;Taishanhong,&#x2019; and 2.5 for &#x2018;Dabenzi,&#x2019; so our genome is of high reference quality as compared with the other draft pomegranate genomes. However, more recently, a chromosome-scale genome assembly of soft-seeded pomegranate cv. &#x2018;Tunisia&#x2019; was reported; the assembly involved the combined use of single-molecule sequencing and high-throughput chromosome conformation capture techniques. The genome covers 320.31 Mb, with 39.96 Mb scaffold N50 value and 4.49 Mb contig N50 value, and the genome includes 33,594 protein-coding genes (<xref ref-type="bibr" rid="B31">Luo et al., 2020</xref>).</p>
<table-wrap position="float" id="T3">
<label>TABLE 3</label>
<caption><p>Comparative metrics of the &#x2018;Bhagawa&#x2019; genome with genomes of other pomegranate varieties available in National Center for Biotechnology Information (NCBI).</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left">S. no.</td>
<td valign="top" align="left">Assembly parameters</td>
<td valign="top" align="left">&#x2018;Taishanhong&#x2019; (illumina)&#x002A;<break/>(<xref ref-type="bibr" rid="B64">Yuan Z. et al., 2018</xref>)</td>
<td valign="top" align="left">&#x2018;Dabenzi&#x2019; (illumina)&#x002A;<break/>(<xref ref-type="bibr" rid="B44">Qin et al., 2017</xref>)</td>
<td valign="top" align="left">&#x2018;Bhagawa&#x2019;<break/>(hybrid approach)</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">1</td>
<td valign="top" align="left">Estimated genome size (Mb)</td>
<td valign="top" align="left">336</td>
<td valign="top" align="left">328.13</td>
<td valign="top" align="left">352.53 (<italic>k</italic> = 31)</td>
</tr>
<tr>
<td valign="top" align="left">2</td>
<td valign="top" align="left">Total size of assembled scaffolds (Mb)</td>
<td valign="top" align="left">274</td>
<td valign="top" align="left">296.38</td>
<td valign="top" align="left">346.08</td>
</tr>
<tr>
<td valign="top" align="left">3</td>
<td valign="top" align="left">Number of scaffolds (&#x2265; 1 kb)</td>
<td valign="top" align="left">2,117</td>
<td valign="top" align="left">2,601</td>
<td valign="top" align="left">342</td>
</tr>
<tr>
<td valign="top" align="left">4</td>
<td valign="top" align="left">N50 scaffold length (Mb)</td>
<td valign="top" align="left">1.7</td>
<td valign="top" align="left">2.3</td>
<td valign="top" align="left">16.12</td>
</tr>
<tr>
<td valign="top" align="left">5</td>
<td valign="top" align="left">Longest scaffold (Mb)</td>
<td valign="top" align="left">7.6</td>
<td valign="top" align="left">9.97</td>
<td valign="top" align="left">22.45</td>
</tr>
<tr>
<td valign="top" align="left">6</td>
<td valign="top" align="left">Total size of assembled contigs (Mb)</td>
<td valign="top" align="left">269</td>
<td valign="top" align="left">N/A</td>
<td valign="top" align="left">337.7</td>
</tr>
<tr>
<td valign="top" align="left">7</td>
<td valign="top" align="left">Number of contigs (&#x2265; 1 kb)</td>
<td valign="top" align="left">7,088</td>
<td valign="top" align="left">N/A</td>
<td valign="top" align="left">446</td>
</tr>
<tr>
<td valign="top" align="left">8</td>
<td valign="top" align="left">N50 contig length</td>
<td valign="top" align="left">97 Kb</td>
<td valign="top" align="left">82.31 Kb</td>
<td valign="top" align="left">6.8 Mb</td>
</tr>
<tr>
<td valign="top" align="left">9</td>
<td valign="top" align="left">Largest contig</td>
<td valign="top" align="left">528.6 Kb</td>
<td valign="top" align="left">N/A</td>
<td valign="top" align="left">18.89 Mb</td>
</tr>
<tr>
<td valign="top" align="left">10</td>
<td valign="top" align="left">GC content (%)</td>
<td valign="top" align="left">39.2</td>
<td valign="top" align="left">39.64</td>
<td valign="top" align="left">41.01</td>
</tr>
<tr>
<td valign="top" align="left">11</td>
<td valign="top" align="left">Number of gene models<xref ref-type="table-fn" rid="t3fns2">&#x002A;&#x002A;</xref></td>
<td valign="top" align="left">30,903</td>
<td valign="top" align="left">29,226</td>
<td valign="top" align="left">29,435</td>
</tr>
<tr>
<td valign="top" align="left">12</td>
<td valign="top" align="left">Mean transcript length (bp)<xref ref-type="table-fn" rid="t3fns2">&#x002A;&#x002A;</xref></td>
<td valign="top" align="left">2332.8</td>
<td valign="top" align="left">2,543</td>
<td valign="top" align="left">2,954</td>
</tr>
<tr>
<td valign="top" align="left">13</td>
<td valign="top" align="left">Mean coding sequence length (bp)<xref ref-type="table-fn" rid="t3fns2">&#x002A;&#x002A;</xref></td>
<td valign="top" align="left">1110.4</td>
<td valign="top" align="left">1,077</td>
<td valign="top" align="left">1,090</td>
</tr>
<tr>
<td valign="top" align="left">14</td>
<td valign="top" align="left">Mean number of exons per gene<xref ref-type="table-fn" rid="t3fns2">&#x002A;&#x002A;</xref></td>
<td valign="top" align="left">4.52</td>
<td valign="top" align="left">4</td>
<td valign="top" align="left">5.1</td>
</tr>
<tr>
<td valign="top" align="left">15</td>
<td valign="top" align="left">Mean exon length (bp)<xref ref-type="table-fn" rid="t3fns2">&#x002A;&#x002A;</xref></td>
<td valign="top" align="left">245.9</td>
<td valign="top" align="left">308</td>
<td valign="top" align="left">286</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="t3fns1"><p>&#x002A;Based on genomes submitted in NCBI.</p></fn>
<fn id="t3fns2"><p>&#x002A;&#x002A;Based on annotation information either in NCBI or in the manuscript.</p></fn>
<fn id="t3fns3"><p>N/A, not available.</p></fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="S2.SS2">
<title>Synteny between genome assemblies</title>
<p>To assess the syntenic relationships between the newly assembled &#x2018;Bhagawa&#x2019; genome and the two previously reported draft genomes, we performed global whole-genome alignments using Minimap2 with parameter &#x201C;asm10&#x201D;; the synteny relationships were visualized as a Jupiter Plot (<xref ref-type="bibr" rid="B23">Jones et al., 2014</xref>). A Circos-based genome assembly consistency plot was used to view large-scale translocations and other large structural variations (<xref ref-type="bibr" rid="B28">Krzywinski et al., 2009</xref>; <xref ref-type="bibr" rid="B23">Jones et al., 2014</xref>). The connecting bands within the circle represent regions of synteny, whereas the blocks on the arc of the circle represent the largest scaffolds in the assembly. The lack of diagonal lines extending from the middle of the scaffold block suggests no definite breaks in synteny between the two assemblies at 10-Kb resolution. We found perfect macro synteny between the &#x2018;Dabenzi&#x2019; vs. &#x2018;Bhagawa&#x2019; genome compared to &#x2018;Taishanhong&#x2019; vs. &#x2018;Bhagawa&#x2019; (<xref ref-type="fig" rid="F4">Figure 4</xref>). These results indicated higher syntenic relationships between &#x2018;Bhagawa&#x2019; and &#x2018;Dabenzi&#x2019; followed by &#x2018;Taishanhiong.&#x2019; Several scaffolds had multiple hits in the &#x2018;Taishanhong&#x2019; vs. &#x2018;Bhagawa&#x2019; plot, thus indicating low levels of genome rearrangements between these two genomes. Similar results were observed with the &#x2018;Dabenzi&#x2019; genome plotted against &#x2018;Taishanhiong.&#x2019;</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption><p>Circos visualization of the syntenic relationship of &#x2018;Bhagawa&#x2019; genome with the genomes of &#x2018;Taishanhong&#x2019; and &#x2018;Dabenzi&#x2019; pomegranate varieties.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-13-947164-g004.tif"/>
</fig>
</sec>
<sec id="S2.SS3">
<title>Structural variation (SV) analyzes</title>
<p>An SV represents a major source of genetic diversity, we investigated overall SVs in the pomegranate genome. We aligned the &#x2018;Bhagawa&#x2019; genome with the &#x2018;Taishanhong&#x2019; and &#x2018;Dabenzi&#x2019; genomes separately by using Assemblytics (<xref ref-type="supplementary-material" rid="DS1">Supplementary Figure 2</xref>). Here, we tried to identify SVs for six different classes: insertion&#x2013;deletion, repeat expansion and contraction, and tandem expansion and contraction, focusing on 1&#x2013;10 Kb between our &#x2018;Bhagawa&#x2019; genome and the other two draft pomegranate genomes. We identified 5.7 Mb and 9.2 Mb SVs for &#x2018;Taishanhong&#x2019; and &#x2018;Dabenzi&#x2019;, respectively, with &#x2018;Bhagawa&#x2019; as a reference (<xref ref-type="supplementary-material" rid="DS1">Supplementary Tables 1A,B</xref> and <xref ref-type="supplementary-material" rid="DS1">Supplementary Figure 2</xref>). Although, all the three cultivars belong to the same species, <italic>P. granatum</italic>, they have accumulated much higher SVs at the nucleotide level in the genome. The SV graph indicates that except for tandem contraction, much higher SVs were observed between &#x2018;Bhagawa&#x2019; and &#x2018;Dabenzi&#x2019; than between &#x2018;Bhagawa&#x2019; and &#x2018;Taishanhong&#x2019; for all the variant classes. Also, the SVs frequency decreased with the increasing size of the nucleotide sequences analyzed for each class. Among the SVs, insertions and deletions contributed much greater to total variations in the genomes, followed by repeat expansion and contraction.</p>
</sec>
<sec id="S2.SS4">
<title>Repetitive sequences</title>
<p>Most plant genomes have highly repetitive regions with transposable elements. We have analyzed the pomegranate genome for these aspects to reveal the basic structural features of the genome. <italic>De novo</italic> analysis of repetitive elements using the Repeat Modeler software revealed a large proportion of repetitive DNA, comparable to the other higher eukaryotic genomes (<xref ref-type="table" rid="T4">Table 4</xref>). Repeat Modeler generated 1,765 different families of repeats known as the <italic>de novo</italic> repeat reference library. A total of 496,570 repetitive elements were in the genome, covering 179,092,850 bp of sequence. Most of the repetitive elements were the interspersed type, consisting of Class I (retro transposons) and Class II (DNA transposons) elements followed by unclassified elements, small RNA, and satellites. Simple direct repeats and low complexity repeats represented only 1.03% and 0.18% of the total repetitive elements. Classification of the observed transposable elements into known classes revealed that most repetitive sequences were retrotransposons (18.27%), whereas 1.10% were DNA transposons (<xref ref-type="table" rid="T4">Table 4</xref>). The most abundant repeats were long-terminal repeat elements (17.33%), of which 13.57% were Gypsy-type elements and 2.95% Copia-type elements (<xref ref-type="table" rid="T4">Table 4</xref>).</p>
<table-wrap position="float" id="T4">
<label>TABLE 4</label>
<caption><p>Different types of repeat elements identified in the &#x2018;Bhagawa&#x2019; genome.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left">Repeats categories</td>
<td valign="top" align="center">Number of elements</td>
<td valign="top" align="center">Length (bp)</td>
<td valign="top" align="center">Percentage of genome</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Retroelements (Class I):</td>
<td valign="top" align="center">46,207</td>
<td valign="top" align="center">632,42,519</td>
<td valign="top" align="center">18.27</td>
</tr>
<tr>
<td valign="top" align="left">-SINEs</td>
<td valign="top" align="center">300</td>
<td valign="top" align="center">91,705</td>
<td valign="top" align="center">0.03</td>
</tr>
<tr>
<td valign="top" align="left">-LINEs (L1/CIN4)</td>
<td valign="top" align="center">6,571</td>
<td valign="top" align="center">316,0098</td>
<td valign="top" align="center">0.91</td>
</tr>
<tr>
<td valign="top" align="left">-LTR elements:</td>
<td valign="top" align="center">39,336</td>
<td valign="top" align="center">59,990,716</td>
<td valign="top" align="center">17.33</td>
</tr>
<tr>
<td valign="top" align="left">-BEL/Pao</td>
<td valign="top" align="center">1,548</td>
<td valign="top" align="center">241,755</td>
<td valign="top" align="center">0.07</td>
</tr>
<tr>
<td valign="top" align="left">-Ty1/Copia</td>
<td valign="top" align="center">8,596</td>
<td valign="top" align="center">10,208,967</td>
<td valign="top" align="center">2.95</td>
</tr>
<tr>
<td valign="top" align="left">-Gypsy</td>
<td valign="top" align="center">26,478</td>
<td valign="top" align="center">46,959,638</td>
<td valign="top" align="center">13.57</td>
</tr>
<tr>
<td valign="top" align="left">-Retroviral</td>
<td valign="top" align="center">1,204</td>
<td valign="top" align="center">862,209</td>
<td valign="top" align="center">0.25</td>
</tr>
<tr>
<td valign="top" align="left">-Others</td>
<td valign="top" align="center">1,510</td>
<td valign="top" align="center">17,181,47</td>
<td valign="top" align="center">0.50</td>
</tr>
<tr>
<td valign="top" align="left">DNA transposons (Class II):</td>
<td valign="top" align="center">6,188</td>
<td valign="top" align="center">38,20,656</td>
<td valign="top" align="center">1.10</td>
</tr>
<tr>
<td valign="top" align="left">-hobo-Activator</td>
<td valign="top" align="center">992</td>
<td valign="top" align="center">580,336</td>
<td valign="top" align="center">0.17</td>
</tr>
<tr>
<td valign="top" align="left">-Tourist/Harbinger</td>
<td valign="top" align="center">1,733</td>
<td valign="top" align="center">10,14,546</td>
<td valign="top" align="center">0.29</td>
</tr>
<tr>
<td valign="top" align="left">-Rolling-circles</td>
<td valign="top" align="center">3,371</td>
<td valign="top" align="center">21,68,970</td>
<td valign="top" align="center">0.63</td>
</tr>
<tr>
<td valign="top" align="left">-Others</td>
<td valign="top" align="center">92</td>
<td valign="top" align="center">56,804</td>
<td valign="top" align="center">0.02</td>
</tr>
<tr>
<td valign="top" align="left">Unclassified</td>
<td valign="top" align="center">333,789</td>
<td valign="top" align="center">106,506,469</td>
<td valign="top" align="center">30.78</td>
</tr>
<tr>
<td valign="top" align="left">Total interspersed repeats</td>
<td/>
<td valign="top" align="center">173,569,644</td>
<td valign="top" align="center">50.16</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="S2.SS5">
<title>Gene prediction and functional annotation</title>
<p>The complete genome sequence of &#x2018;Bhagawa&#x2019; (&#x223C;346 Mb) was analyzed for gene prediction <italic>ab initio</italic> and by using a homology-based approach with the BRAKER/MAKER pipeline. A total of 29,435 genes were predicted with an average size of 2,954 bp, with average exon and intron sizes of 286 and 368 bp, respectively (<xref ref-type="supplementary-material" rid="DS1">Supplementary File 2</xref>). All predicted genes were functionally annotated by following a consensus approach of known homologous or predictive sequence signatures by Cluster of Orthologous Groups, Gene Ontology, InterProScan, Kyoto Encyclopedia of Genes and Genomes, Uniprot, and EggNOG (<xref ref-type="fig" rid="F5">Figures 5</xref>, <xref ref-type="fig" rid="F6">6</xref>). In total, 96.04% of genes had sufficient similarity entries in databases to tentatively assign gene functions. Only 3.96% of genes remain unannotated. The overall GC content of the genome was 41.01% (<xref ref-type="table" rid="T3">Table 3</xref>). Additionally, 617 transfer RNA genes were predicted in the genome.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption><p>Functional annotation of the predicted genes from &#x2018;Bhagawa&#x2019; genome by using NCBI, NR, Kyoto Encyclopedia of Genes and Genomes, Uniport, Gene Ontology, Cluster of Orthologous Groups, and Eukaryotic Orthologous Groups databases.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-13-947164-g005.tif"/>
</fig>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption><p>Functional classification of genes from &#x2018;Bhagawa&#x2019; genome.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-13-947164-g006.tif"/>
</fig>
<p>The complete genome represented 93.68% of the 1440 ortholog genes, with 64 missing and 27 fragmented genes, according to step-wise BUSCO assessment of the Embryophyta lineage. We also successfully validated the four transcriptome data samples (NCBI database: SRR5187757, SRR5187758, SRR5187763, and SRR5187764) of bacterial blight-challenged pomegranate tissues by mapping them onto the reference genome. As a result, 85% of 95% of reads showed significant matches to the genome (<xref ref-type="supplementary-material" rid="DS1">Supplementary Figure 3</xref>) (<xref ref-type="bibr" rid="B27">Kozlov et al., 2019</xref>). These results indicated an extremely low proportion of misassemblies in the gene-rich regions. The transcriptome assembly does not necessarily represent all pomegranate genes; it is restricted to the tissue types used, and genes expressed at low levels are likely under-represented.</p>
<p>To reconfirm the phylogenetic position of our newly sequenced pomegranate, cv. &#x2018;Bhagawa,&#x2019; and to identify expansion, contraction, and rapidly evolving gene families in the <italic>Punica</italic> clade in relation to four other sequenced plant genomes (<xref ref-type="supplementary-material" rid="DS1">Supplementary Figure 1</xref>), we performed whole-genome phylogenetic analysis. For this, we used CAFE software after pruning the gene families containing a single species. From these analyzes, pomegranate and <italic>E. grandis</italic> diverged 64 (60&#x2013;70) million years ago (MYA), after the paleotetraploidy event (109 MYA) was identified in the <italic>E. grandis</italic> genome (<xref ref-type="fig" rid="F7">Figure 7</xref>). Therefore, this whole-genome duplication event is shared by pomegranate and <italic>E. grandis</italic> (<xref ref-type="bibr" rid="B36">Myburg et al., 2014</xref>; <xref ref-type="bibr" rid="B63">Yuan J. et al., 2018</xref>). We also found a higher divergence period between the grape and pomegranate genomes, which suggests that pomegranate and grape did not undergo a recent genome duplication as per results from syntenic block analysis between pomegranate, Eucalyptus, and grape genomes (<xref ref-type="bibr" rid="B36">Myburg et al., 2014</xref>; <xref ref-type="bibr" rid="B63">Yuan J. et al., 2018</xref>).</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption><p>Phylogenetic tree based on gene families by using Computational Analysis of Gene Family Evolution (CAFE) software.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-13-947164-g007.tif"/>
</fig>
<p>To study the gene families that had expanded or contracted in pomegranate, we have estimated and compared gene gain and loss rates (&#x03BB;) using the two-lambda model for gene families from pomegranate with those of four other representative ancestral species. In total, 965 gene families had expanded in number; 5,406 gene families had contracted in number; and 115 families had rapidly evolved in the pomegranate genome, with &#x03BB; value 0.0059 as compared with its most recent common ancestor, Eucalyptus (<xref ref-type="supplementary-material" rid="TS2">Supplementary Table 2</xref> and <xref ref-type="fig" rid="F7">Figure 7</xref>). However, the grape genome had the most divergent species with gene family evolution (&#x03BB; 0.0038) as compared with the other genomes.</p>
</sec>
<sec id="S2.SS6">
<title>Resistance genes and transcription factor identification</title>
<p>Resistance genes in the &#x2018;Bhagawa&#x2019; genome were identified by using the protein sequence of predicted genes and the Plant Stress Protein Database (PSPDB). A total of 1,573 protein-coding genes were identified as resistance genes, classified into 32 domains. Among these, Kinase, TM (577); Kinase, LRR, TM (203); LRR, TM (194); and kinase (132) domains increased in number (<xref ref-type="table" rid="T5">Table 5</xref>). Transcription factors were predicted by using PlantTFDB, with 1,533 proteins identified as transcription factors in &#x2018;Bhagawa.&#x2019; These transcription factors are divided into 57 transcription factor families. Genes related to MYB were highest in number, followed by bHLH, ERF, NAC, and C2H2 families (<xref ref-type="table" rid="T6">Table 6</xref>).</p>
<table-wrap position="float" id="T5">
<label>TABLE 5</label>
<caption><p>Disease resistance genes identified in &#x2018;Bhagawa&#x2019;.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left">Domain</td>
<td valign="top" align="center">Number of genes</td>
<td valign="top" align="left">Domain</td>
<td valign="top" align="center">Number of genes</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Kinase, TM</td>
<td valign="top" align="center">577</td>
<td valign="top" align="left">CC, Kinase, LRR, TM</td>
<td valign="top" align="center">10</td>
</tr>
<tr>
<td valign="top" align="left">Kinase, LRR, TM</td>
<td valign="top" align="center">203</td>
<td valign="top" align="left">CC, LRR, TM</td>
<td valign="top" align="center">9</td>
</tr>
<tr>
<td valign="top" align="left">LRR,T M</td>
<td valign="top" align="center">194</td>
<td valign="top" align="left">CC, NBS</td>
<td valign="top" align="center">8</td>
</tr>
<tr>
<td valign="top" align="left">Kinase</td>
<td valign="top" align="center">132</td>
<td valign="top" align="left">LRR, NBS, TIR</td>
<td valign="top" align="center">6</td>
</tr>
<tr>
<td valign="top" align="left">CC, Kinase, TM</td>
<td valign="top" align="center">57</td>
<td valign="top" align="left">CC, LRR, NBS, TIR, TM</td>
<td valign="top" align="center">5</td>
</tr>
<tr>
<td valign="top" align="left">NBS, TM</td>
<td valign="top" align="center">57</td>
<td valign="top" align="left">LRR, NBS</td>
<td valign="top" align="center">5</td>
</tr>
<tr>
<td valign="top" align="left">LRR, NBS, TIR, TM</td>
<td valign="top" align="center">55</td>
<td valign="top" align="left">CC, LRR, NBS</td>
<td valign="top" align="center">3</td>
</tr>
<tr>
<td valign="top" align="left">LRR, NBS, TM</td>
<td valign="top" align="center">42</td>
<td valign="top" align="left">CC, LRR</td>
<td valign="top" align="center">2</td>
</tr>
<tr>
<td valign="top" align="left">CC, NBS, TM</td>
<td valign="top" align="center">41</td>
<td valign="top" align="left">CC, TIR</td>
<td valign="top" align="center">2</td>
</tr>
<tr>
<td valign="top" align="left">CC, LRR, NBS, TM</td>
<td valign="top" align="center">37</td>
<td valign="top" align="left">NBS, TIR</td>
<td valign="top" align="center">2</td>
</tr>
<tr>
<td valign="top" align="left">LRR</td>
<td valign="top" align="center">36</td>
<td valign="top" align="left">TM</td>
<td valign="top" align="center">2</td>
</tr>
<tr>
<td valign="top" align="left">NBS</td>
<td valign="top" align="center">19</td>
<td valign="top" align="left">CC</td>
<td valign="top" align="center">1</td>
</tr>
<tr>
<td valign="top" align="left">NBS, TIR, TM</td>
<td valign="top" align="center">19</td>
<td valign="top" align="left">Kinase, LRR</td>
<td valign="top" align="center">1</td>
</tr>
<tr>
<td valign="top" align="left">TIR</td>
<td valign="top" align="center">17</td>
<td valign="top" align="left">Kinase, NBS, TM</td>
<td valign="top" align="center">1</td>
</tr>
<tr>
<td valign="top" align="left">CC, Kinase</td>
<td valign="top" align="center">14</td>
<td valign="top" align="left">LRR, TIR</td>
<td valign="top" align="center">1</td>
</tr>
<tr>
<td valign="top" align="left">TIR, TM</td>
<td valign="top" align="center">14</td>
<td valign="top" align="left">LRR, TIR, TM</td>
<td valign="top" align="center">1</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap position="float" id="T6">
<label>TABLE 6</label>
<caption><p>Transcription factor families and their counts in &#x2018;Bhagawa&#x2019;.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left">TF_family</td>
<td valign="top" align="left">No. of proteins</td>
<td valign="top" align="left">TF_family</td>
<td valign="top" align="left">No. of proteins</td>
<td valign="top" align="left">TF_family</td>
<td valign="top" align="left">No. of proteins</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">MYB</td>
<td valign="top" align="left">157</td>
<td valign="top" align="left">TCP</td>
<td valign="top" align="left">23</td>
<td valign="top" align="left">EIL</td>
<td valign="top" align="left">6</td>
</tr>
<tr>
<td valign="top" align="left">bHLH</td>
<td valign="top" align="left">123</td>
<td valign="top" align="left">FAR1</td>
<td valign="top" align="left">21</td>
<td valign="top" align="left">YABBY</td>
<td valign="top" align="left">6</td>
</tr>
<tr>
<td valign="top" align="left">ERF</td>
<td valign="top" align="left">123</td>
<td valign="top" align="left">ARF</td>
<td valign="top" align="left">19</td>
<td valign="top" align="left">BBR-BPC</td>
<td valign="top" align="left">5</td>
</tr>
<tr>
<td valign="top" align="left">NAC</td>
<td valign="top" align="left">108</td>
<td valign="top" align="left">AP2</td>
<td valign="top" align="left">15</td>
<td valign="top" align="left">CPP</td>
<td valign="top" align="left">4</td>
</tr>
<tr>
<td valign="top" align="left">C2H2</td>
<td valign="top" align="left">97</td>
<td valign="top" align="left">TALE</td>
<td valign="top" align="left">15</td>
<td valign="top" align="left">LSD</td>
<td valign="top" align="left">3</td>
</tr>
<tr>
<td valign="top" align="left">WRKY</td>
<td valign="top" align="left">66</td>
<td valign="top" align="left">CO-like</td>
<td valign="top" align="left">13</td>
<td valign="top" align="left">RAV</td>
<td valign="top" align="left">3</td>
</tr>
<tr>
<td valign="top" align="left">bZIP</td>
<td valign="top" align="left">59</td>
<td valign="top" align="left">NF-YB</td>
<td valign="top" align="left">13</td>
<td valign="top" align="left">HB-PHD</td>
<td valign="top" align="left">2</td>
</tr>
<tr>
<td valign="top" align="left">MYB_related</td>
<td valign="top" align="left">56</td>
<td valign="top" align="left">ZF-HD</td>
<td valign="top" align="left">13</td>
<td valign="top" align="left">HRT-like</td>
<td valign="top" align="left">2</td>
</tr>
<tr>
<td valign="top" align="left">B3</td>
<td valign="top" align="left">54</td>
<td valign="top" align="left">GeBP</td>
<td valign="top" align="left">12</td>
<td valign="top" align="left">NF-X1</td>
<td valign="top" align="left">2</td>
</tr>
<tr>
<td valign="top" align="left">M-type_MADS</td>
<td valign="top" align="left">53</td>
<td valign="top" align="left">SBP</td>
<td valign="top" align="left">12</td>
<td valign="top" align="left">Whirly</td>
<td valign="top" align="left">2</td>
</tr>
<tr>
<td valign="top" align="left">GRAS</td>
<td valign="top" align="left">49</td>
<td valign="top" align="left">ARR-B</td>
<td valign="top" align="left">11</td>
<td valign="top" align="left">LFY</td>
<td valign="top" align="left">1</td>
</tr>
<tr>
<td valign="top" align="left">G2-like</td>
<td valign="top" align="left">40</td>
<td valign="top" align="left">GRF</td>
<td valign="top" align="left">10</td>
<td valign="top" align="left">S1Fa-like</td>
<td valign="top" align="left">1</td>
</tr>
<tr>
<td valign="top" align="left">HD-ZIP</td>
<td valign="top" align="left">40</td>
<td valign="top" align="left">NF-YC</td>
<td valign="top" align="left">10</td>
<td valign="top" align="left">SAP</td>
<td valign="top" align="left">1</td>
</tr>
<tr>
<td valign="top" align="left">LBD</td>
<td valign="top" align="left">37</td>
<td valign="top" align="left">Nin-like</td>
<td valign="top" align="left">9</td>
<td valign="top" align="left">STAT</td>
<td valign="top" align="left">1</td>
</tr>
<tr>
<td valign="top" align="left">C3H</td>
<td valign="top" align="left">36</td>
<td valign="top" align="left">WOX</td>
<td valign="top" align="left">9</td>
<td valign="top" align="left">VOZ</td>
<td valign="top" align="left">1</td>
</tr>
<tr>
<td valign="top" align="left">MIKC_MADS</td>
<td valign="top" align="left">32</td>
<td valign="top" align="left">DBB</td>
<td valign="top" align="left">8</td>
<td valign="top" align="left">E2F/DP</td>
<td valign="top" align="left">7</td>
</tr>
<tr>
<td valign="top" align="left">Trihelix</td>
<td valign="top" align="left">31</td>
<td valign="top" align="left">HB-other</td>
<td valign="top" align="left">8</td>
<td valign="top" align="left">SRS</td>
<td valign="top" align="left">7</td>
</tr>
<tr>
<td valign="top" align="left">Dof</td>
<td valign="top" align="left">30</td>
<td valign="top" align="left">NF-YA</td>
<td valign="top" align="left">8</td>
<td/>
<td/>
</tr>
<tr>
<td valign="top" align="left">GATA</td>
<td valign="top" align="left">23</td>
<td valign="top" align="left">BES1</td>
<td valign="top" align="left">7</td>
<td/>
<td/>
</tr>
<tr>
<td valign="top" align="left">HSF</td>
<td valign="top" align="left">23</td>
<td valign="top" align="left">CAMTA</td>
<td valign="top" align="left">6</td>
<td/>
<td/>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="S2.SS7">
<title>Microsatellite identification</title>
<p>The masked genome was used to identify simple sequence repeats (SSRs) by using two different tools (MISA and PERF). Since PERF does not identify complex/compound SSRs, we retained outcomes from MISA only. A total length of 2.52 Mb or approximately 0.7% was identified as SSRs in the genome. Then SSRs were divided into three categories according to their length as follows: (1) &#x2264; 12 bp, (2) 12&#x2013;19 bp, and (3) &#x2265; 20 bp. SSRs &#x2264; 12 bp were higher in number than the other SSR categories, and mononucleotide SSRs were in very high abundance (<xref ref-type="table" rid="T7">Table 7</xref>).</p>
<table-wrap position="float" id="T7">
<label>TABLE 7</label>
<caption><p>Identified simple sequent repeats in pomegranate genome.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left">Type</td>
<td valign="top" align="center">Number (&#x2264; 12 bp)</td>
<td valign="top" align="center">Number (12&#x2013;19 bp)</td>
<td valign="top" align="center">Number (&#x2265; 20 bp)</td>
<td valign="top" align="center">Length covered by SSRs</td>
<td valign="top" align="center">Software</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Mono</td>
<td valign="top" align="center">63,194</td>
<td valign="top" align="center">16,369</td>
<td valign="top" align="center">3,055</td>
<td valign="top" align="center">10,01,124</td>
<td valign="top" align="center">MISA and PERF</td>
</tr>
<tr>
<td valign="top" align="left">Di</td>
<td valign="top" align="center">10,771</td>
<td valign="top" align="center">28,324</td>
<td valign="top" align="center">1,9387</td>
<td valign="top" align="center">11,41,770</td>
<td/>
</tr>
<tr>
<td valign="top" align="left">Tri</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">8,641</td>
<td valign="top" align="center">4,820</td>
<td valign="top" align="center">2,73,408</td>
<td/>
</tr>
<tr>
<td valign="top" align="left">Tetra</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">1,695</td>
<td valign="top" align="center">1,128</td>
<td valign="top" align="center">64,698</td>
<td/>
</tr>
<tr>
<td valign="top" align="left">Penta</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">799</td>
<td valign="top" align="center">22,000</td>
<td/>
</tr>
<tr>
<td valign="top" align="left">Hexa</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">0</td>
<td valign="top" align="center">553</td>
<td valign="top" align="center">18,185</td>
<td/>
</tr>
<tr>
<td valign="top" align="left">Total</td>
<td valign="top" align="center">73,965</td>
<td valign="top" align="center">55,029</td>
<td valign="top" align="center">29,742</td>
<td valign="top" align="center">25,21,185</td>
<td/>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="S2.SS8">
<title>MicroRNA (miRNA) classification</title>
<p>miRNAs are important regulators of several biological processes, such as plant growth and development. These are 20&#x2013;24 nt in length. A total of 314 copies of miRNAs belonging to 26 different families were identified in the &#x2018;Bhagawa&#x2019; genome (<xref ref-type="fig" rid="F8">Figure 8</xref>).</p>
<fig id="F8" position="float">
<label>FIGURE 8</label>
<caption><p>MicroRNAs representing 26 different families identified in the &#x2018;Bhagawa&#x2019; genome.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fpls-13-947164-g008.tif"/>
</fig>
</sec>
</sec>
<sec id="S3" sec-type="discussion">
<title>Discussion</title>
<p>A high-quality complete genome assembly is a valuable genomic resource for identifying structural variants, gene and marker discovery, integrating phenotype&#x2013;genotype associations, and elucidating the crop&#x2019;s genome evolution and genetic architecture. The genome sequence information can also be used to understand the phylogenetic position of pomegranate and to identify rapidly evolving gene families in the <italic>Punica</italic> clade in relation to other sequenced plant genomes. The reference-quality pomegranate genome assembled in the present study would certainly be a valuable resource for dissecting many important biological and metabolic traits and a powerful tool to accelerate the pomegranate crop improvement program (<xref ref-type="bibr" rid="B44">Qin et al., 2017</xref>).</p>
<p>During the earlier years of the next-generation sequencing revolution, genomes were chiefly assembled by using short-read approaches. However, short-read&#x2013;based genome assemblies and subsequent data analyzes have major fallacies, such as the inability to span highly repetitive regions longer than the read length and heterozygosity resolution (<xref ref-type="bibr" rid="B62">Xu and Wang, 2007</xref>; <xref ref-type="bibr" rid="B48">Simao et al., 2015</xref>; <xref ref-type="bibr" rid="B2">Ananthasayanam et al., 2019</xref>). The latest fourth-generation sequencing platforms, such as PacBio Sequel, 10X Genomics, and Optical mapping using BioNano, can play a significant role in improving the quality of assembled genomes with a considerable reduction in cost and time required for sequencing. These tools can generate long-read sequences aimed to resolve the above issues but with significantly more errors. So, using a hybrid approach with third-generation sequencing technologies, such as Illumina, and fourth-generation sequencing platforms, such as PacBio Sequel, the quality of the genome assembly can be improved significantly at an affordable cost. The quality of the genome assembled using the hybrid technologies are highly efficient to those assembled using only one sequencing platform. We have demonstrated how a combination of commercially available technologies from Illumina, 10X Genomics, and BioNano Genomics can efficiently be used to assemble high-quality <italic>de novo</italic> sequence scaffolds. Optical mapping for super-scaffolding on long PacBio reads and 10X chromium synthetic-linked reads for assembling a highly contiguous genome was also recommended by other researchers (<xref ref-type="bibr" rid="B35">Mostovoy et al., 2016</xref>; <xref ref-type="bibr" rid="B2">Ananthasayanam et al., 2019</xref>).</p>
<p>The N50 value of 16.12 Mb, genome coverage of more than 98% within 342 scaffolds, LAI value of 10, and 93.68% BUSCO completeness score over the 1,440 ortholog genes of the complete pomegranate genome indicate the quality of the pomegranate genome assembled in the present study. The better N50 contig length (6.8 Mb) and high N50 scaffold value (16.12 Mb) as compared to the published pomegranate genomes of &#x2018;Taishanhong&#x2019; (97 Kb, 1.7 Mb) and &#x2018;Dabenzi&#x2019; (82.31 Kb, 2.3 Mb), as well as covering more than 98% of the genome in 342 scaffolds as compared to 2117 and 2601 scaffolds for a lesser percentage of genome coverage in &#x2018;Taishanhong&#x2019; and &#x2018;Dabenzi,&#x2019; respectively, indicates the high quality of the assembled genome of pomegranate cv. &#x2018;Bhagawa&#x2019; (<xref ref-type="bibr" rid="B44">Qin et al., 2017</xref>; <xref ref-type="bibr" rid="B64">Yuan Z. et al., 2018</xref>). Programs such as the LTR retriever RepeatMasker and RepeatModeler are mostly used for accurate <italic>de novo</italic> identification of intact LTR retrotransposons (<xref ref-type="bibr" rid="B62">Xu and Wang, 2007</xref>; <xref ref-type="bibr" rid="B12">Ellinghaus et al., 2008</xref>; <xref ref-type="bibr" rid="B41">Ou and Jiang, 2018</xref>; <xref ref-type="bibr" rid="B65">Zhang et al., 2019</xref>). More intact LTR elements could be identified from more completed genomes as compared with draft genomes (<xref ref-type="bibr" rid="B41">Ou and Jiang, 2018</xref>). In turn, the amount of identifiable intact LTR elements can indicate the assembly quality of the intergenic and repetitive sequence space. The LAI can be an indicator of the completeness of the genome, where LAI &#x003C; 10 can be considered draft assembly, LAI 10&#x2013;19 reference-quality assembly, and LAI &#x2265; 20 gold-standard assembly (<xref ref-type="bibr" rid="B40">Ou et al., 2018</xref>).</p>
<p>Similarly, completeness is better gaged by using a set of genes that are universally distributed as orthologs across particular clades of species (<xref ref-type="bibr" rid="B56">Treangen and Salzberg, 2012</xref>). A summary of complete single-copy, duplicated, fragmented, and missing BUSCO genes is often provided as a quantitative measure of genome completeness based on expected gene content (<xref ref-type="bibr" rid="B48">Simao et al., 2015</xref>; <xref ref-type="bibr" rid="B47">Seppey et al., 2019</xref>). These transcription factors play a pivotal role in the developmental regulation of gene expression and response of plants to various biotic and abiotic stresses. The most predominant transcription factors in the pomegranate genome were MYB, bHLH, ERF, NAC, and C2H2 families, and these are involved in defense, developmental regulation of gene expression, the response of plants to various biotic and abiotic stresses, and the detoxification response related to drought (<xref ref-type="bibr" rid="B49">Singh et al., 2012</xref>; <xref ref-type="bibr" rid="B33">Mittal et al., 2018</xref>). The bHLH family is related to drought stress by regulating stomatal development, meristemoid differentiation, and guard cell morphogenesis (<xref ref-type="bibr" rid="B43">Pillitteri et al., 2007</xref>). miRNAs are important regulators of several biological processes and stress responses. We identified 314 copies of miRNA belonging to 26 different families (<xref ref-type="bibr" rid="B24">Jones-Rhoades et al., 2006</xref>; <xref ref-type="bibr" rid="B54">Sunkar et al., 2007</xref>; <xref ref-type="bibr" rid="B49">Singh et al., 2012</xref>).</p>
<p>The reference-quality genome assembly of the &#x2018;Bhagawa&#x2019; genome in the current study will be an invaluable resource to molecular studies in &#x2018;Bhagawa&#x2019; and other species related to pomegranate.</p>
</sec>
<sec id="S4" sec-type="materials|methods">
<title>Materials and methods</title>
<sec id="S4.SS1">
<title>Plant materials</title>
<p>The most commercially grown and popular Indian pomegranate cultivar &#x2018;Bhagawa&#x2019; was chosen for genome sequencing. The variety is currently being maintained at field Gene Bank of ICAR-NRCP, Solapur, India. This variety has a medium plant height (1.5 mt), bearing deep red fruits with large size (&#x003E;250 g), thick rind having dark red-colored bold arils with the soft seed type. The soft red arils of this variety are mainly preferred for edible and processing purposes because of their higher juice percentage (45%), TSS (15.9&#x00B0;Brix), vitamin C (14.60 mg/100 g fresh arils), anthocyanin (360 mg/100 g), iron (0.32 mg/100 g), and zinc (0.50 mg/100 g) content. This variety is a late-maturing type (180 days from flowering to harvesting) with a high yield potential (20 tonnes/ha) widely grown across the country. The newly emerged leaves were taken for DNA isolation and subsequent downstream operations.</p>
</sec>
<sec id="S4.SS2">
<title>Genome sequencing</title>
<p>High-molecular-weight genomic DNA (&#x003E;50 Kb) extraction and purification were performed using the Genomic-tip 100/G genomic DNA isolation kit (Qiagen). DNA concentration was measured by using NanoDrop (Thermo Fisher Scientific) and Qubit 2.0 (Invitrogen) instruments. The integrity and quality of genomic DNA were confirmed by using the Bio-Rad<sup>&#x00AE;</sup> CHEF Mapper<sup>&#x00AE;</sup> XA Pulsed Field Electrophoresis system. High-quality sequencing data were generated using four different sequencing and mapping technologies (i.e., Illumina, 10X Chromium, PacBio Sequel, and DLS BioNanoSaphyr optical mapping). Illumina sequencing libraries were constructed by using the NEBNext UltraTM DNA Library Prep Kit (Illumina). The 10X Chromium genomic libraries were prepared by using the Chromium Genome HT Library Kit and Gel Bead Kit v2. The SMRTbell library was prepared using SMRTbell Express Template Preparation Kit. For the construction of optical genome maps, standard BioNano protocols, nicking, labeling, repair, and staining processes were implemented. Specifically, DNA was digested by the single-stranded nicking endonuclease Nt.BspQI. Optical maps were assembled with BioNano Irys View analysis software; only single molecules with a minimum length of 100 kb and six labels per molecule were used.</p>
</sec>
<sec id="S4.SS3">
<title>Genome assembly</title>
<p>We performed a genome survey using the 10X Chromium datasets before the genome assembly. Initially, the data were de-barcoded by using scaff_reads from Scaff10x v4. Kmer-genie was used to generate histograms at multiple k-mers. The histogram from <italic>k</italic> = 31 was used to run GenomeScope v1.0 at a maximum k-mer coverage of 10,000 for estimating the genome size, heterozygosity, and repetitive and unique content of the genome (<xref ref-type="bibr" rid="B59">Vurture et al., 2017</xref>). After this, we proceeded with genome assembly step by step by using various datasets obtained from the sequencing. The genome was assembled by using the Falcon and Phased falcon-unzip module (<xref ref-type="bibr" rid="B9">Chin et al., 2017</xref>). The unzipped genome was polished by using Arrow as a part of the unzipping pipeline. Then the genome was scaffolded iteratively twice by using Scaff10X v4<sup><xref ref-type="fn" rid="footnote3">3</xref></sup> with the de-barcoded 10X Chromium reads. BioNano Tools 1v.3.8041.8044 and Solve 3.3_10252018 were used to build a consensus genome map by using molecules &#x003E; 150 Kb long and hosting 8 labels (<xref ref-type="bibr" rid="B53">Stankova et al., 2016</xref>).</p>
<p>The <italic>de novo</italic> assembled Optical Maps were then used to super-scaffold the Scaff10X scaffolded genome by using the Hybrid Scaffolds tool from the same BioNano solve release (<xref ref-type="bibr" rid="B53">Stankova et al., 2016</xref>). Gaps introduced by both Scaff10X and Hybrid Scaffolds toolkits were filled by using PBJelly2 once and later by polishing using Pilon, and BUSCO v3 used with Embryophyta lineage constituting 1440 orthologs was performed at each step to determine the completeness of the genome assembly (<xref ref-type="bibr" rid="B14">English et al., 2012</xref>; <xref ref-type="bibr" rid="B60">Walker et al., 2014</xref>; <xref ref-type="bibr" rid="B48">Simao et al., 2015</xref>). Additionally, on the Pilon-polished genome, we mapped transcriptome data (SRR5187757, SRR5187758, SRR5187763, and SRR5187764) of four samples by using HiSAT2 to check for gene-model completion and to aid in the annotation process (<xref ref-type="bibr" rid="B26">Kim et al., 2014</xref>; <xref ref-type="bibr" rid="B16">Geib et al., 2018</xref>). Deep-Sequenced Illumina short-read datasets were mapped to the genome by using BWA, and subsequent alignments were used to polish the genome by using Pilon. Assemblies from the &#x2018;Dabenzi&#x2019; and &#x2018;Taishanhong&#x2019; cultivars were aligned to &#x2018;Bhagawa&#x2019; by using the &#x201C;asm5&#x201D; parameter from minimap2. Various other genomes, <italic>Arabidopsis thaliana, Vitis vinifera, E. grandis</italic>, and <italic>Theobroma cacoa</italic>, were aligned with &#x2018;Bhagawa&#x2019; by using the &#x201C;asm10&#x201D; parameter. Variants were called from the alignments by using Assemblytics (<xref ref-type="bibr" rid="B37">Nattestad and Schatz, 2016</xref>), commit df5361f from GitHub from sizes 1&#x2013;10,000, with a unique anchor length of 10 kb.</p>
<p>Circos Jupiter graphs were plotted to check the assembly continuity and any misassembles between the &#x2018;Dabenzi&#x2019; and &#x2018;Taishanhong&#x2019; genomes with respect to the &#x2018;Bhagawa&#x2019; genome. We used the largest scaffolds representing 75% of the genome length, consisting of scaffolds &#x003E; 100 Kb long and with no breakages for at least 50 Kb. Scaffolds were broken into fragments if there was a continuous stretch of 100 Kb, then &#x201C;N&#x201D;&#x2019;s had to be removed (i.e., false alignments). The alignments were computed by using Minimap2 with the parameter &#x201C;asm10&#x201D;<sup><xref ref-type="fn" rid="footnote4">4</xref></sup>.</p>
</sec>
<sec id="S4.SS4">
<title>Genome annotation</title>
<p>To identify and classify different repeats in the pomegranate genome sequences, we used the RepeatModeler-open-1.0.10 pipeline to construct a <italic>de novo</italic> repeat library (<xref ref-type="bibr" rid="B51">Smit et al., 2008</xref>). Repeat sequences related to the <italic>Punica</italic> genus were obtained from the RepeatMasker library to classify the repeats by using RepeatClassifier. <italic>De novo</italic> identified repeat sequences, and plant-related repeat sequences were merged to create a custom library. Masking of the genome involved using RepeatMasker v 4.0.9 with the custom library (<xref ref-type="bibr" rid="B55">Tarailo-Graovac and Nansheng, 2009</xref>).</p>
<p>We created an orthologs protein set of 4 plant species, including <italic>V. vinifera</italic>, <italic>P. granatum</italic> (&#x2018;Dabenzi&#x2019;), <italic>T. cacao</italic>, and <italic>E. grandis</italic> by using OrthoVenn 2 (<xref ref-type="bibr" rid="B61">Wang et al., 2015</xref>). Ortholog protein sets shared by at least two species were submitted to BRAKER2.0 using &#x2013;prg = gth and &#x2013;prot_seq options. GTFs from the mapped transcriptome data were merged by using StringTie v1.3.6 to create a catalog of putative transcripts (<xref ref-type="bibr" rid="B42">Pertea et al., 2015</xref>). BRAKER2.0 was used to train Augustus v3.3 with the merged GTF and protein alignments (<xref ref-type="bibr" rid="B52">Stanke et al., 2006</xref>). Gene models were further improved <italic>via</italic> MAKER2 by providing the gff file generated by using Augustus v3.3, the protein alignment file generated through genome threader (gth), and a CDS file generated by using StringTie v1.3.6; MAKER2 was run iteratively twice to refine the gene predictions (<xref ref-type="bibr" rid="B7">Cantarel et al., 2008</xref>).</p>
<p>The predicted gene set was annotated by using EggNOG mapper and blasted against the UniProt<sup><xref ref-type="fn" rid="footnote5">5</xref></sup> <italic>Viridi plantae</italic> dataset and InterProScan to filter out false-positives generated by MAKER2 (<xref ref-type="bibr" rid="B58">Van Nguyen and Dominique, 2009</xref>; <xref ref-type="bibr" rid="B23">Jones et al., 2014</xref>; <xref ref-type="bibr" rid="B21">Huerta-Cepas et al., 2017</xref>). The curated gene sets were re-annotated by using the same databases. Finally, genome Annotation Generator (GAG) v2.0. was used to add start and stop codons and identify various metrics based on the annotated GFF (<xref ref-type="bibr" rid="B16">Geib et al., 2018</xref>). Genes flagged as overlapping or contained by GAG were removed by using BedTools Intersect.</p>
</sec>
<sec id="S4.SS5">
<title>Microsatellites identification</title>
<p>High-throughput SSRs were identified by using MISA (<xref ref-type="bibr" rid="B4">Beier et al., 2017</xref>) and PERF v0.2.5 with the same parameters (<xref ref-type="bibr" rid="B3">Avvaru et al., 2017</xref>). The parameters used were minimum SSR motif length of 10 bp and repeat length mono-10, di-6, tri-5, tetra-5, penta-5, and hexa-5; the maximum size of interruption allowed between two different SSRs in a compound sequence was 100 bp. Concordant SSRs between the two approaches were chosen by using Bedtools Intersect (<xref ref-type="bibr" rid="B45">Quinlan, 2010</xref>) with a 90% reciprocal overlap.</p>
</sec>
</sec>
<sec id="S5">
<title>Resistance genes and transcription factor identification</title>
<p>Plant stress resistance genes were downloaded from Plant Stress Protein Database (PSPDB<sup><xref ref-type="fn" rid="footnote6">6</xref></sup> <sup>,<xref ref-type="fn" rid="footnote7">7</xref></sup>) (<xref ref-type="bibr" rid="B29">Kumar et al., 2014</xref>). To identify resistance genes in pomegranate, we performed a Blastp of predicted protein sequences of pomegranate against downloaded protein sequences of resistance genes with e-value cutoff (1e-5), query coverage (50%), and sequence identity (50%) (<xref ref-type="bibr" rid="B1">Altschul et al., 1997</xref>). Transcription factors were predicted by using PlantTFDB V4.0 by selecting Arabidopsis as a reference (<xref ref-type="bibr" rid="B16">Geib et al., 2018</xref>).</p>
<sec id="S5.SS1">
<title>Orthologs identification and estimated gene gain and loss rates</title>
<p>We used Orthofinder 2.3.3 to define gene families across five genomes: <italic>P. granatum</italic> cv. &#x2018;Bhagawa,&#x2019; <italic>A. thaliana, E. grandis, T. cacao</italic>, and <italic>V. vinifera</italic> downloaded from NCBI(<xref ref-type="bibr" rid="B13">Emms David and Steven, 2015</xref>). We used the options Diamond to blast, MSA using MAFFT, and tree inference using raxml-ng (<xref ref-type="bibr" rid="B25">Katoh et al., 2005</xref>; <xref ref-type="bibr" rid="B6">Buchfink et al., 2015</xref>). CAFE 4.2.1 was used to identify expansion, contraction, and rapidly evolving gene families in the <italic>Punica</italic> clade (<xref ref-type="bibr" rid="B11">De Bie et al., 2006</xref>; <xref ref-type="bibr" rid="B57">UniProt Consortium, 2014</xref>; <xref ref-type="bibr" rid="B27">Kozlov et al., 2019</xref>; <xref ref-type="bibr" rid="B50">Singh et al., 2021</xref>). We estimated gene gain and loss rates with a two-lambda model.</p>
</sec>
</sec>
<sec id="S6" sec-type="data-availability">
<title>Data availability statement</title>
<p>The original contributions presented in this study are publicly available. The NCBI data accession numbers: <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="PRJNA445950">PRJNA445950</ext-link>, <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="PRJNA562100">PRJNA562100</ext-link>, <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="PRJNA505392">PRJNA505392</ext-link>, <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="PRJNA505397">PRJNA505397</ext-link>, <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="PRJNA505398">PRJNA505398</ext-link>, and <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="PRJNA505582">PRJNA505582</ext-link>.</p>
</sec>
<sec id="S7">
<title>Author contributions</title>
<p>PR, PS, NS, and PP: conceptualization of idea, planning of research experiments, collection and processing of samples, compilation of data, secondary analysis of data, and drafting the manuscript. PN and UR: compilation of data, and secondary analysis of data and drafting the manuscript. JS, KB, and RM: drafting the manuscript and review of the manuscript. VS and DM: collection and processing of samples. All authors contributed to the article and approved the submitted version.</p>
</sec>
</body>
<back>
<sec id="S8" sec-type="funding-information">
<title>Funding</title>
<p>This project was fully funded by the Indian Council of Agricultural Research, New Delhi, under the project draft genome sequencing of pomegranate (<italic>Punica granatum</italic> L.) (Project code- IXX13119).</p>
</sec>
<ack>
<p>All authors acknowledge the Indian Council of Agricultural Research, New Delhi, for financial support and the authors are thankful to Mr. Dushyant Singh Baghel, Nucleome Informatics Pvt. Ltd., Hyderabad, for the sequencing work.</p>
</ack>
<sec id="S9" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="S10" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="S11" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fpls.2022.947164/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fpls.2022.947164/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Data_Sheet_1.docx" id="DS1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table_2.XLSX" id="TS2" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table_3.XLSX" id="TS3" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<fn-group>
<fn id="footnote1"><label>1</label><p><ext-link ext-link-type="uri" xlink:href="http://nhb.gov.in">http://nhb.gov.in</ext-link></p></fn>
<fn id="footnote2"><label>2</label><p><ext-link ext-link-type="uri" xlink:href="http://agriexchange.apeda.gov.in">http://agriexchange.apeda.gov.in</ext-link></p></fn>
<fn id="footnote3"><label>3</label><p><ext-link ext-link-type="uri" xlink:href="https://github.com/wtsi-hpag/Scaff10X">https://github.com/wtsi-hpag/Scaff10X</ext-link></p></fn>
<fn id="footnote4"><label>4</label><p><ext-link ext-link-type="uri" xlink:href="https://github.com/JustinChu/JupiterPlot.git">https://github.com/JustinChu/JupiterPlot.git</ext-link></p></fn>
<fn id="footnote5"><label>5</label><p><ext-link ext-link-type="uri" xlink:href="http://www.uniprot.org">www.uniprot.org</ext-link></p></fn>
<fn id="footnote6"><label>6</label><p><ext-link ext-link-type="uri" xlink:href="https://bioclues.org">https://bioclues.org</ext-link></p></fn>
<fn id="footnote7"><label>7</label><p><ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/">https://www.ncbi.nlm.nih.gov/</ext-link></p></fn>
</fn-group>
<ref-list>
<title>References</title>
<ref id="B1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Altschul</surname> <given-names>S. F.</given-names></name> <name><surname>Madden</surname> <given-names>T.</given-names></name> <name><surname>Sch&#x00E4;ffer</surname> <given-names>A. A.</given-names></name> <name><surname>Zhang</surname> <given-names>J.</given-names></name> <name><surname>Zhang</surname> <given-names>Z.</given-names></name> <name><surname>Miller</surname> <given-names>W.</given-names></name><etal/></person-group> (<year>1997</year>). <article-title>Gapped BLAST and PSI-BLAST: a new generation of protein database search programs.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>25</volume> <fpage>3389</fpage>&#x2013;<lpage>3402</lpage>.</citation></ref>
<ref id="B2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ananthasayanam</surname> <given-names>S.</given-names></name> <name><surname>Kothandaraman</surname> <given-names>H.</given-names></name> <name><surname>Nayee</surname> <given-names>N.</given-names></name> <name><surname>Saha</surname> <given-names>S.</given-names></name> <name><surname>Baghel</surname> <given-names>D. S.</given-names></name> <name><surname>Gopalakrishnan</surname> <given-names>K.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>First near complete haplotype phased genome assembly of River buffalo (<italic>Bubalus bubalis</italic>).</article-title> <source><italic>BioRxiv</italic> [Preprint]</source>. <pub-id pub-id-type="doi">10.1101/618785</pub-id></citation></ref>
<ref id="B3"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Avvaru</surname> <given-names>A. K.</given-names></name> <name><surname>Sowpati</surname> <given-names>D. T.</given-names></name> <name><surname>Mishra</surname> <given-names>R. K.</given-names></name></person-group> (<year>2017</year>). <article-title>PERF: an exhaustive algorithm for ultra-fast and efficient identification of microsatellites from large DNA sequences.</article-title> <source><italic>Bioinformatics</italic></source> <volume>34</volume> <fpage>943</fpage>&#x2013;<lpage>948</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btx721</pub-id> <pub-id pub-id-type="pmid">29121165</pub-id></citation></ref>
<ref id="B4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Beier</surname> <given-names>S.</given-names></name> <name><surname>Thiel</surname> <given-names>T.</given-names></name> <name><surname>M&#x00FC;nch</surname> <given-names>T.</given-names></name> <name><surname>Scholz</surname> <given-names>U.</given-names></name> <name><surname>Mascher</surname> <given-names>M.</given-names></name></person-group> (<year>2017</year>). <article-title>MISA-web: a web server for microsatellite prediction.</article-title> <source><italic>Bioinformatics</italic></source> <volume>33</volume> <fpage>2583</fpage>&#x2013;<lpage>2585</lpage>.</citation></ref>
<ref id="B5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Berger</surname> <given-names>B. A.</given-names></name> <name><surname>Kriebel</surname> <given-names>R.</given-names></name> <name><surname>Spalink</surname> <given-names>D.</given-names></name> <name><surname>Sytsma</surname> <given-names>K. J.</given-names></name></person-group> (<year>2016</year>). <article-title>Divergence times, historical biogeography, and shifts in speciation rates of Myrtales.</article-title> <source><italic>Mol. Phylogenet. Evol.</italic></source> <volume>95</volume> <fpage>116</fpage>&#x2013;<lpage>136</lpage>. <pub-id pub-id-type="doi">10.1016/j.ympev.2015.10.001</pub-id> <pub-id pub-id-type="pmid">26585030</pub-id></citation></ref>
<ref id="B6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Buchfink</surname> <given-names>B.</given-names></name> <name><surname>Xie</surname> <given-names>C.</given-names></name> <name><surname>Huson</surname> <given-names>D. H.</given-names></name></person-group> (<year>2015</year>). <article-title>Fast and sensitive protein alignment using diamond.</article-title> <source><italic>Nat. Methods</italic></source> <volume>12</volume>:<issue>59</issue>. <pub-id pub-id-type="doi">10.1038/nmeth.3176</pub-id> <pub-id pub-id-type="pmid">25402007</pub-id></citation></ref>
<ref id="B7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cantarel</surname> <given-names>B. L.</given-names></name> <name><surname>Korf</surname> <given-names>I.</given-names></name> <name><surname>Robb</surname> <given-names>S. M.</given-names></name> <name><surname>Parra</surname> <given-names>G.</given-names></name> <name><surname>Ross</surname> <given-names>E.</given-names></name> <name><surname>Moore</surname> <given-names>B.</given-names></name><etal/></person-group> (<year>2008</year>). <article-title>Maker: an easy-to-use annotation pipeline designed for emerging model organism genomes.</article-title> <source><italic>Genome Res.</italic></source> <volume>18</volume> <fpage>188</fpage>&#x2013;<lpage>196</lpage>. <pub-id pub-id-type="doi">10.1101/gr.6743907</pub-id> <pub-id pub-id-type="pmid">18025269</pub-id></citation></ref>
<ref id="B8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chandra</surname> <given-names>R.</given-names></name> <name><surname>Dhinesh Babu</surname> <given-names>K.</given-names></name> <name><surname>Jadhav</surname> <given-names>T. V.</given-names></name> <name><surname>Teixeira da Silva</surname> <given-names>J. A.</given-names></name></person-group> (<year>2010</year>). <article-title>Origin, history and domestication of pomegranate.</article-title> <source><italic>Fruit Veg. Cereal Sci. Biotechnol.</italic></source> <volume>2</volume> <fpage>1</fpage>&#x2013;<lpage>6</lpage>. <pub-id pub-id-type="doi">10.1093/aob/mcv077</pub-id> <pub-id pub-id-type="pmid">26141130</pub-id></citation></ref>
<ref id="B9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chin</surname> <given-names>C. S.</given-names></name> <name><surname>Peluso</surname> <given-names>P.</given-names></name> <name><surname>Sedlazeck</surname> <given-names>F.</given-names></name> <name><surname>Nattestad</surname> <given-names>M.</given-names></name> <name><surname>Concepcion</surname> <given-names>G. T.</given-names></name> <name><surname>Clum</surname> <given-names>A.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>Phased diploid genome assembly with single-molecule real-time sequencing.</article-title> <source><italic>Nat Methods</italic></source> <volume>13</volume>:<issue>1050</issue>.</citation></ref>
<ref id="B10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>da Silva</surname> <given-names>J. T.</given-names></name> <name><surname>Rana</surname> <given-names>T. S.</given-names></name> <name><surname>Narzary</surname> <given-names>D. S.</given-names></name> <name><surname>Verma</surname> <given-names>N.</given-names></name> <name><surname>Meshram</surname> <given-names>D. T.</given-names></name> <name><surname>Ranade</surname> <given-names>S. A.</given-names></name></person-group> (<year>2013</year>). <article-title>Pomegranate biology and biotechnology: a review.</article-title> <source><italic>Sci. Hortic.</italic></source> <volume>160</volume> <fpage>85</fpage>&#x2013;<lpage>107</lpage>.</citation></ref>
<ref id="B11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>De Bie</surname> <given-names>T.</given-names></name> <name><surname>Cristianini</surname> <given-names>N.</given-names></name> <name><surname>Demuth</surname> <given-names>J. P.</given-names></name> <name><surname>Hahn</surname> <given-names>M. W.</given-names></name></person-group> (<year>2006</year>). <article-title>CAFE: a computational tool for the study of gene family evolution.</article-title> <source><italic>Bioinformatics</italic></source> <volume>22</volume> <fpage>1269</fpage>&#x2013;<lpage>1271</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btl097</pub-id> <pub-id pub-id-type="pmid">16543274</pub-id></citation></ref>
<ref id="B12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ellinghaus</surname> <given-names>D.</given-names></name> <name><surname>Kurtz</surname> <given-names>S.</given-names></name> <name><surname>Willhoeft</surname> <given-names>U.</given-names></name></person-group> (<year>2008</year>). <article-title>LTRharvest, an efficient and flexible software for de novo detection of LTR retrotransposons.</article-title> <source><italic>BMC Bioinform.</italic></source> <volume>9</volume>:<issue>18</issue>. <pub-id pub-id-type="doi">10.1186/1471-2105-9-18</pub-id> <pub-id pub-id-type="pmid">18194517</pub-id></citation></ref>
<ref id="B13"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Emms David</surname> <given-names>M.</given-names></name> <name><surname>Steven</surname> <given-names>K.</given-names></name></person-group> (<year>2015</year>). <article-title>OrthoFinder: solving fundamental biases in whole genome comparisons dramatically improves orthogroup inference accuracy.</article-title> <source><italic>Gen. Bio.</italic></source> <volume>16</volume>:<issue>157</issue>. <pub-id pub-id-type="doi">10.1186/s13059-015-0721-2</pub-id> <pub-id pub-id-type="pmid">26243257</pub-id></citation></ref>
<ref id="B14"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>English</surname> <given-names>A. C.</given-names></name> <name><surname>Richards</surname> <given-names>S.</given-names></name> <name><surname>Han</surname> <given-names>Y.</given-names></name> <name><surname>Wang</surname> <given-names>M.</given-names></name> <name><surname>Vee</surname> <given-names>V.</given-names></name> <name><surname>Qu</surname> <given-names>J.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>Mind the gap: upgrading genomes with Pacific Biosciences RS long-read sequencing technology.</article-title> <source><italic>PLoS One</italic></source> <volume>7</volume>:<issue>e47768</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0047768</pub-id> <pub-id pub-id-type="pmid">23185243</pub-id></citation></ref>
<ref id="B15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ferrara</surname> <given-names>G.</given-names></name> <name><surname>Selahvarzi</surname> <given-names>Y.</given-names></name> <name><surname>Ahmadpourmir</surname> <given-names>H.</given-names></name> <name><surname>Mazzea</surname> <given-names>A.</given-names></name> <name><surname>Giancaspro</surname> <given-names>A.</given-names></name></person-group> (<year>2021</year>). &#x201C;<article-title>Productionand Growing area</article-title>,&#x201D; in <source><italic>The Pomegranate: Botany, Production and Uses</italic></source>, <role>eds</role> <person-group person-group-type="editor"><name><surname>Sarkhosh</surname> <given-names>A.</given-names></name> <name><surname>Yavari</surname> <given-names>A. M.</given-names></name> <name><surname>Zamani</surname> <given-names>Z.</given-names></name></person-group> (<publisher-loc>Wallingford, UK</publisher-loc>: <publisher-name>CABI International</publisher-name>), <fpage>59</fpage>&#x2013;<lpage>93</lpage>.</citation></ref>
<ref id="B16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Geib</surname> <given-names>S. M.</given-names></name> <name><surname>Hall</surname> <given-names>B.</given-names></name> <name><surname>Derego</surname> <given-names>T.</given-names></name> <name><surname>Bremer</surname> <given-names>F. T.</given-names></name> <name><surname>Cannoles</surname> <given-names>K.</given-names></name> <name><surname>Sim</surname> <given-names>B. S.</given-names></name></person-group> (<year>2018</year>). <article-title>Genome Annotation Generator: a simple tool for generating and correcting WGS annotation tables for NCBI submission.</article-title> <source><italic>Giga Sci.</italic></source> <volume>7</volume>:<issue>4</issue>. <pub-id pub-id-type="doi">10.1093/gigascience/giy018</pub-id> <pub-id pub-id-type="pmid">29635297</pub-id></citation></ref>
<ref id="B17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Graham</surname> <given-names>S. A.</given-names></name> <name><surname>Graham</surname> <given-names>A.</given-names></name></person-group> (<year>2014</year>). <article-title>Ovary, fruit, and seed morphology of the <italic>Lythraceae</italic>.</article-title> <source><italic>Int. Plant Sci.</italic></source> <volume>175</volume> <fpage>202</fpage>&#x2013;<lpage>204</lpage>.</citation></ref>
<ref id="B18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Guarino</surname> <given-names>L. T.</given-names></name> <name><surname>Miller</surname> <given-names>M.</given-names></name> <name><surname>Baazara</surname> <given-names>N.</given-names></name></person-group> (<year>1990</year>). <article-title>Obadi. Socotra: the island of Bliss revisited.</article-title> <source><italic>Diversity</italic></source> <volume>6</volume> <fpage>28</fpage>&#x2013;<lpage>31</lpage>.</citation></ref>
<ref id="B19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Halvorsen</surname> <given-names>B. L.</given-names></name> <name><surname>Holte</surname> <given-names>K.</given-names></name> <name><surname>Myhrstad</surname> <given-names>M. C. W.</given-names></name> <name><surname>Barikmo</surname> <given-names>I.</given-names></name> <name><surname>Hvattum</surname> <given-names>E.</given-names></name> <name><surname>Remberg</surname> <given-names>S. F.</given-names></name><etal/></person-group> (<year>2002</year>). <article-title>A systematic screening of total antioxidants in dietary plants.</article-title> <source><italic>J. Nutr</italic>.</source> <volume>132</volume> <fpage>461</fpage>&#x2013;<lpage>471</lpage>. <pub-id pub-id-type="doi">10.1093/jn/132.3.461</pub-id> <pub-id pub-id-type="pmid">11880572</pub-id></citation></ref>
<ref id="B20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Holland</surname> <given-names>D.</given-names></name> <name><surname>Hatib</surname> <given-names>K.</given-names></name> <name><surname>Bar-Ya&#x2019;akov</surname> <given-names>I.</given-names></name></person-group> (<year>2009</year>). &#x201C;<article-title>Pomegranate: botany, horticulture, breeding</article-title>,&#x201D; in <source><italic>Horticultural Reviews</italic></source>, <role>ed.</role> <person-group person-group-type="editor"><name><surname>Janick</surname> <given-names>J.</given-names></name></person-group> (<publisher-loc>Hoboken, NJ</publisher-loc>: <publisher-name>John Wiley &#x0026; Sons, Inc</publisher-name>), <volume>127</volume>. <pub-id pub-id-type="doi">10.1002/9780470593776.ch2</pub-id></citation></ref>
<ref id="B21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Huerta-Cepas</surname> <given-names>J.</given-names></name> <name><surname>Forslund</surname> <given-names>K.</given-names></name> <name><surname>Coelho</surname> <given-names>L. P.</given-names></name> <name><surname>Szklarczyk</surname> <given-names>D.</given-names></name> <name><surname>Jensen</surname> <given-names>L. J.</given-names></name> <name><surname>Mering</surname> <given-names>C. V.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>Fast genome-wide functional annotation through orthology assignment by eggNOG-mapper.</article-title> <source><italic>Mol. Bio. Evol.</italic></source> <volume>34</volume> <fpage>2115</fpage>&#x2013;<lpage>2122</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msx148</pub-id> <pub-id pub-id-type="pmid">28460117</pub-id></citation></ref>
<ref id="B22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Johanningsmeier</surname> <given-names>S. D.</given-names></name> <name><surname>Harris</surname> <given-names>G. K.</given-names></name></person-group> (<year>2011</year>). <article-title>Pomegranate as a functional food and nutraceutical source.</article-title> <source><italic>Ann. Rev. Food Sci. Technol.</italic></source> <volume>2</volume> <fpage>181</fpage>&#x2013;<lpage>201</lpage>. <pub-id pub-id-type="doi">10.1146/annurev-food-030810-153709</pub-id> <pub-id pub-id-type="pmid">22129380</pub-id></citation></ref>
<ref id="B23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jones</surname> <given-names>P.</given-names></name> <name><surname>Binns</surname> <given-names>D.</given-names></name> <name><surname>Chang</surname> <given-names>H. Y.</given-names></name> <name><surname>McAnulla</surname> <given-names>C.</given-names></name> <name><surname>McWilliam</surname> <given-names>H.</given-names></name> <name><surname>Maslen</surname> <given-names>J.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>InterProScan 5: genome-scale protein function classification.</article-title> <source><italic>Bioinformatics</italic></source> <volume>30</volume> <fpage>1236</fpage>&#x2013;<lpage>1240</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btu031</pub-id> <pub-id pub-id-type="pmid">24451626</pub-id></citation></ref>
<ref id="B24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jones-Rhoades</surname> <given-names>M. W.</given-names></name> <name><surname>Bartel</surname> <given-names>D. P.</given-names></name> <name><surname>Bartel</surname> <given-names>B.</given-names></name></person-group> (<year>2006</year>). <article-title>MicroRNAS and their regulatory roles in plants.</article-title> <source><italic>Ann. Rev. Plant Biol.</italic></source> <volume>57</volume> <fpage>19</fpage>&#x2013;<lpage>53</lpage>.</citation></ref>
<ref id="B25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Katoh</surname> <given-names>K.</given-names></name> <name><surname>Kuma</surname> <given-names>K.</given-names></name> <name><surname>Miyata</surname> <given-names>T.</given-names></name> <name><surname>Toh</surname> <given-names>H.</given-names></name></person-group> (<year>2005</year>). <article-title>Improvement in the accuracy of multiple sequence alignment program MAFFT.</article-title> <source><italic>Genome Inform.</italic></source> <volume>16</volume> <fpage>22</fpage>&#x2013;<lpage>33</lpage>.</citation></ref>
<ref id="B26"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kim</surname> <given-names>D.</given-names></name> <name><surname>Ben</surname> <given-names>L.</given-names></name> <name><surname>Steven</surname> <given-names>L.</given-names></name> <name><surname>Salzberg</surname> <given-names>S. L.</given-names></name></person-group> (<year>2014</year>). <article-title>HISAT: a fast spliced aligner with low memory requirements.</article-title> <source><italic>Nat. Methods</italic></source> <volume>12</volume>:<issue>357</issue>. <pub-id pub-id-type="doi">10.1038/nmeth.3317</pub-id> <pub-id pub-id-type="pmid">25751142</pub-id></citation></ref>
<ref id="B27"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kozlov</surname> <given-names>A. M.</given-names></name> <name><surname>Darriba</surname> <given-names>D.</given-names></name> <name><surname>Flouri</surname> <given-names>T.</given-names></name> <name><surname>Morel</surname> <given-names>B.</given-names></name> <name><surname>Stamatakis</surname> <given-names>A.</given-names></name></person-group> (<year>2019</year>). <article-title>RAxML-NG: a fast, scalable, and user-friendly tool for maximum likelihood phylogenetic inference.</article-title> <source><italic>Bioinformatics</italic></source> <volume>35</volume> <fpage>4453</fpage>&#x2013;<lpage>4455</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btz305</pub-id> <pub-id pub-id-type="pmid">31070718</pub-id></citation></ref>
<ref id="B28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Krzywinski</surname> <given-names>M.</given-names></name> <name><surname>Schein</surname> <given-names>J.</given-names></name> <name><surname>Birol</surname> <given-names>I.</given-names></name> <name><surname>Connors</surname> <given-names>J.</given-names></name> <name><surname>Gascoyne</surname> <given-names>R.</given-names></name> <name><surname>Horsman</surname> <given-names>D.</given-names></name><etal/></person-group> (<year>2009</year>). <article-title>Circos: an information aesthetic for comparative genomics.</article-title> <source><italic>Gen. Res.</italic></source> <volume>16</volume> <fpage>39</fpage>&#x2013;<lpage>45</lpage>. <pub-id pub-id-type="doi">10.1101/gr.092759.109</pub-id> <pub-id pub-id-type="pmid">19541911</pub-id></citation></ref>
<ref id="B29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kumar</surname> <given-names>S. A.</given-names></name> <name><surname>Kumari</surname> <given-names>P. H.</given-names></name> <name><surname>Sundararajan</surname> <given-names>V. S.</given-names></name> <name><surname>Suravajhala</surname> <given-names>P.</given-names></name> <name><surname>Kanagasabai</surname> <given-names>R.</given-names></name> <name><surname>Kavi Kishor</surname> <given-names>P. B.</given-names></name></person-group> (<year>2014</year>). <article-title>PSPDB: plant stress protein database.</article-title> <source><italic>Plant Mol. Bio. Rep.</italic></source> <volume>32</volume> <fpage>940</fpage>&#x2013;<lpage>942</lpage>. <pub-id pub-id-type="doi">10.1007/s11105-014-0698-0</pub-id></citation></ref>
<ref id="B30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Levin</surname> <given-names>G. M.</given-names></name></person-group> (<year>2006</year>). <source><italic>Pomegranate. 1st Ed.</italic></source> <publisher-loc>East Libra Drive Tempe, AZ</publisher-loc>: <publisher-name>Third Millennium Publishing</publisher-name>.</citation></ref>
<ref id="B31"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Luo</surname> <given-names>X.</given-names></name> <name><surname>Li</surname> <given-names>H.</given-names></name> <name><surname>Wu</surname> <given-names>Z.</given-names></name> <name><surname>Yao</surname> <given-names>W.</given-names></name> <name><surname>Zhao</surname> <given-names>P.</given-names></name> <name><surname>Cao</surname> <given-names>D.</given-names></name><etal/></person-group> (<year>2020</year>). <article-title>The pomegranate (<italic>Punica granatum</italic> L.) draft genome dissects genetic divergence between soft- and hard-seeded cultivars.</article-title> <source><italic>Plant Biotechnol. J.</italic></source> <volume>18</volume> <fpage>955</fpage>&#x2013;<lpage>968</lpage>. <pub-id pub-id-type="doi">10.1111/pbi.13260</pub-id> <pub-id pub-id-type="pmid">31549477</pub-id></citation></ref>
<ref id="B32"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mars</surname> <given-names>M.</given-names></name></person-group> (<year>2000</year>). <article-title>Pomegranate plant material: genetic resources and breeding, a review.</article-title> <source><italic>Options Mediterr.</italic></source> <volume>42</volume> <fpage>55</fpage>&#x2013;<lpage>62</lpage>.</citation></ref>
<ref id="B33"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mittal</surname> <given-names>S.</given-names></name> <name><surname>Banduni</surname> <given-names>P.</given-names></name> <name><surname>Mallikarjuna</surname> <given-names>M. G.</given-names></name> <name><surname>Jain</surname> <given-names>P. A.</given-names></name> <name><surname>Prasanta</surname> <given-names>K.</given-names></name> <name><surname>Dash</surname> <given-names>P. K.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>Structural, functional, and evolutionary characterization of major drought transcription factors families in maize.</article-title> <source><italic>Front. Chem.</italic></source> <volume>6</volume>:<issue>177</issue>.</citation></ref>
<ref id="B34"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Moriguchi</surname> <given-names>T.</given-names></name> <name><surname>Omura</surname> <given-names>M.</given-names></name> <name><surname>Matsula</surname> <given-names>N.</given-names></name> <name><surname>Kozaki</surname> <given-names>J.</given-names></name></person-group> (<year>1987</year>). <article-title><italic>In Vitro</italic> adventitious shoot formation from anthers of pomegranate.</article-title> <source><italic>Hortscience</italic></source> <volume>22</volume> <fpage>947</fpage>&#x2013;<lpage>994</lpage>.</citation></ref>
<ref id="B35"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mostovoy</surname> <given-names>Y.</given-names></name> <name><surname>Levy-Sakin</surname> <given-names>M.</given-names></name> <name><surname>Lam</surname> <given-names>J.</given-names></name> <name><surname>Lam</surname> <given-names>E. T.</given-names></name> <name><surname>Hastie</surname> <given-names>A. R.</given-names></name> <name><surname>Marks</surname> <given-names>P.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>A hybrid approach for de novo human genome sequence assembly and phasing.</article-title> <source><italic>Nat. Methods</italic></source> <volume>13</volume> <fpage>587</fpage>&#x2013;<lpage>590</lpage>. <pub-id pub-id-type="doi">10.1038/nmeth.3865</pub-id> <pub-id pub-id-type="pmid">27159086</pub-id></citation></ref>
<ref id="B36"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Myburg</surname> <given-names>A. A.</given-names></name> <name><surname>Grattapaglia</surname> <given-names>D.</given-names></name> <name><surname>Tuskan</surname> <given-names>G. A.</given-names></name> <name><surname>Hellsten</surname> <given-names>U.</given-names></name> <name><surname>Hayes</surname> <given-names>R. D.</given-names></name> <name><surname>Grimwood</surname> <given-names>J.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>The genome of <italic>Eucalyptus grandis</italic>.</article-title> <source><italic>Nature</italic></source> <volume>510</volume> <fpage>356</fpage>&#x2013;<lpage>362</lpage>. <pub-id pub-id-type="doi">10.1038/nature13308</pub-id> <pub-id pub-id-type="pmid">24919147</pub-id></citation></ref>
<ref id="B37"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nattestad</surname> <given-names>M.</given-names></name> <name><surname>Schatz</surname> <given-names>M. C.</given-names></name></person-group> (<year>2016</year>). <article-title>Assemblytics: a web analytics tool for the detection of variants from an assembly.</article-title> <source><italic>Bioinformatics</italic></source> <volume>32</volume> <fpage>3021</fpage>&#x2013;<lpage>3023</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btw369</pub-id> <pub-id pub-id-type="pmid">27318204</pub-id></citation></ref>
<ref id="B38"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ono</surname> <given-names>E.</given-names></name> <name><surname>Nozawa</surname> <given-names>T.</given-names></name> <name><surname>Ogata</surname> <given-names>T.</given-names></name> <name><surname>Motohashi</surname> <given-names>M.</given-names></name> <name><surname>Higo</surname> <given-names>N.</given-names></name> <name><surname>Kobayashi</surname> <given-names>T.</given-names></name><etal/></person-group> (<year>2011</year>). &#x201C;<article-title>Relationship between social interaction and mental health</article-title>,&#x201D; in <source><italic>2011 IEEE/SICE International Symposium on System Integration, SII</italic></source>, (<publisher-loc>Kyoto</publisher-loc>: <publisher-name>IEEE</publisher-name>), <fpage>246</fpage>&#x2013;<lpage>249</lpage>.</citation></ref>
<ref id="B39"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ophir</surname> <given-names>R.</given-names></name> <name><surname>Sherman</surname> <given-names>A.</given-names></name> <name><surname>Rubinstein</surname> <given-names>M.</given-names></name> <name><surname>Eshed</surname> <given-names>R.</given-names></name> <name><surname>Sharabi Schwager</surname> <given-names>M.</given-names></name> <name><surname>Harel-Beja</surname> <given-names>R.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>Single-Nucleotide Polymorphism Markers from De-Novo Assembly of the Pomegranate Transcriptome Reveal Germplasm Genetic Diversity.</article-title> <source><italic>PLoS One</italic></source> <volume>9</volume>:<issue>e88998</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0088998</pub-id> <pub-id pub-id-type="pmid">24558460</pub-id></citation></ref>
<ref id="B40"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ou</surname> <given-names>S.</given-names></name> <name><surname>Chen</surname> <given-names>J.</given-names></name> <name><surname>Jiang</surname> <given-names>N.</given-names></name></person-group> (<year>2018</year>). <article-title>Assessing genome assembly quality using the LTR Assembly Index (LAI).</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>46</volume>:<issue>e126</issue>. <pub-id pub-id-type="doi">10.1093/nar/gky730</pub-id> <pub-id pub-id-type="pmid">30107434</pub-id></citation></ref>
<ref id="B41"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ou</surname> <given-names>S.</given-names></name> <name><surname>Jiang</surname> <given-names>N.</given-names></name></person-group> (<year>2018</year>). <article-title>LTR retriever: a highly accurate and sensitive program for identification of long terminal repeat retrotransposons.</article-title> <source><italic>Plant Physiol.</italic></source> <volume>176</volume> <fpage>1410</fpage>&#x2013;<lpage>1422</lpage>. <pub-id pub-id-type="doi">10.1104/pp.17.01310</pub-id> <pub-id pub-id-type="pmid">29233850</pub-id></citation></ref>
<ref id="B42"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pertea</surname> <given-names>M.</given-names></name> <name><surname>Pertea</surname> <given-names>G. M.</given-names></name> <name><surname>Antonescu</surname> <given-names>C. M.</given-names></name> <name><surname>Chang</surname> <given-names>T. C.</given-names></name> <name><surname>Mendell</surname> <given-names>J. T.</given-names></name> <name><surname>Salzberg</surname> <given-names>S. L.</given-names></name></person-group> (<year>2015</year>). <article-title>String Tie enables improved reconstruction of a transcriptome from RNA-seq reads.</article-title> <source><italic>Nat. Biotechnol.</italic></source> <volume>33</volume>:<issue>290</issue>. <pub-id pub-id-type="doi">10.1038/nbt.3122</pub-id> <pub-id pub-id-type="pmid">25690850</pub-id></citation></ref>
<ref id="B43"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pillitteri</surname> <given-names>L. J.</given-names></name> <name><surname>Sloan</surname> <given-names>D. B.</given-names></name> <name><surname>Bogenschutz</surname> <given-names>N. L.</given-names></name> <name><surname>Torii</surname> <given-names>K. U.</given-names></name></person-group> (<year>2007</year>). <article-title>Termination of asymmetric cell division and differentiation of stomata.</article-title> <source><italic>Nature</italic></source> <volume>445</volume> <fpage>501</fpage>&#x2013;<lpage>505</lpage>. <pub-id pub-id-type="doi">10.1038/nature05467</pub-id> <pub-id pub-id-type="pmid">17183267</pub-id></citation></ref>
<ref id="B44"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Qin</surname> <given-names>G.</given-names></name> <name><surname>Xu</surname> <given-names>C.</given-names></name> <name><surname>Ming</surname> <given-names>R.</given-names></name> <name><surname>Tang</surname> <given-names>H.</given-names></name> <name><surname>Guyot</surname> <given-names>R.</given-names></name> <name><surname>Kramer</surname> <given-names>E. M.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>The pomegranate (<italic>Punica granatum</italic> L.) genome and the genomics of punicalagin biosynthesis.</article-title> <source><italic>Plant J.</italic></source> <volume>9</volume> <fpage>1108</fpage>&#x2013;<lpage>1128</lpage>. <pub-id pub-id-type="doi">10.1111/tpj.13625</pub-id> <pub-id pub-id-type="pmid">28654223</pub-id></citation></ref>
<ref id="B45"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Quinlan</surname> <given-names>A. R.</given-names></name></person-group> (<year>2010</year>). <article-title>Hall. BEDTools: a flexible suite of utilities for comparing genomic features.</article-title> <source><italic>Bioinformatics</italic></source> <volume>26</volume> <fpage>841</fpage>&#x2013;<lpage>842</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btq033</pub-id> <pub-id pub-id-type="pmid">20110278</pub-id></citation></ref>
<ref id="B46"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Saminathan</surname> <given-names>T.</given-names></name> <name><surname>Bodunrin</surname> <given-names>A.</given-names></name> <name><surname>Singh</surname> <given-names>N. V.</given-names></name> <name><surname>Devarajan</surname> <given-names>R.</given-names></name> <name><surname>Nimmakayala</surname> <given-names>P.</given-names></name> <name><surname>Jeff</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>Genome-wide identification of microRNAs in pomegranate (<italic>Punica granatum</italic> L.) by high-throughput sequencing.</article-title> <source><italic>BMC Plant Biol.</italic></source> <volume>16</volume>:<issue>122</issue>. <pub-id pub-id-type="doi">10.1186/s12870-016-0807-3</pub-id> <pub-id pub-id-type="pmid">27230657</pub-id></citation></ref>
<ref id="B47"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Seppey</surname> <given-names>M.</given-names></name> <name><surname>Manni</surname> <given-names>M.</given-names></name> <name><surname>Zdobnov</surname> <given-names>E. V.</given-names></name></person-group> (<year>2019</year>). <article-title>BUSCO: assessing Genome Assembly and Annotation Completeness.</article-title> <source><italic>Methods Mol. Biol.</italic></source> <volume>1962</volume> <fpage>227</fpage>&#x2013;<lpage>245</lpage>. <pub-id pub-id-type="doi">10.1007/978-1-4939-9173-0_14</pub-id></citation></ref>
<ref id="B48"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Simao</surname> <given-names>A. F.</given-names></name> <name><surname>Waterhouse</surname> <given-names>R. M.</given-names></name> <name><surname>Ioannidis</surname> <given-names>P.</given-names></name> <name><surname>Kriventseva</surname> <given-names>E. V.</given-names></name> <name><surname>Zdobnov</surname> <given-names>E. M.</given-names></name></person-group> (<year>2015</year>). <article-title>BUSCO: assessing genome assembly and annotation completeness with single-copy orthologs.</article-title> <source><italic>Bioinformatics</italic></source> <volume>31</volume> <fpage>3210</fpage>&#x2013;<lpage>3212</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btv351</pub-id> <pub-id pub-id-type="pmid">26059717</pub-id></citation></ref>
<ref id="B49"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Singh</surname> <given-names>N. K.</given-names></name> <name><surname>Gupta</surname> <given-names>D. K.</given-names></name> <name><surname>Jayaswal</surname> <given-names>P. K.</given-names></name> <name><surname>Mahato</surname> <given-names>A. K.</given-names></name> <name><surname>Dutta</surname> <given-names>S.</given-names></name> <name><surname>Singh</surname> <given-names>S.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>The first draft of the pigeon pea genome sequence.</article-title> <source><italic>J. Plant Biochem. Biotechnol.</italic></source> <volume>21</volume> <fpage>98</fpage>&#x2013;<lpage>112</lpage>. <pub-id pub-id-type="doi">10.1007/s13562-011-0088-8</pub-id> <pub-id pub-id-type="pmid">24431589</pub-id></citation></ref>
<ref id="B50"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Singh</surname> <given-names>N. V.</given-names></name> <name><surname>Patil</surname> <given-names>P. G.</given-names></name> <name><surname>Sowjanya</surname> <given-names>R. P.</given-names></name> <name><surname>Parashuram</surname> <given-names>S.</given-names></name> <name><surname>Natarajan</surname> <given-names>P.</given-names></name> <name><surname>Babu</surname> <given-names>K. D.</given-names></name><etal/></person-group> (<year>2021</year>). <article-title>Chloroplast Genome Sequencing, Comparative Analysis, and Discovery of Unique Cytoplasmic Variants in Pomegranate (<italic>Punica granatum</italic> L.).</article-title> <source><italic>Front. Genet.</italic></source> <volume>12</volume>:<issue>704075</issue>.</citation></ref>
<ref id="B51"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Smit</surname> <given-names>H. A.</given-names></name> <name><surname>Robinson</surname> <given-names>T. J.</given-names></name> <name><surname>Watson</surname> <given-names>J.</given-names></name> <name><surname>Vuuren</surname> <given-names>J. A.</given-names></name></person-group> (<year>2008</year>). <article-title>New Species of Elephant-shrew (<italic>Afrotheria</italic>: <italic>Macroscelidea</italic>: <italic>Elephantulus</italic>) from South Africa.</article-title> <source><italic>J. Mammal.</italic></source> <volume>89</volume> <fpage>1257</fpage>&#x2013;<lpage>1268</lpage>.</citation></ref>
<ref id="B52"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Stanke</surname> <given-names>M.</given-names></name> <name><surname>Tzvetkova</surname> <given-names>A.</given-names></name> <name><surname>Morgenstern</surname> <given-names>B.</given-names></name></person-group> (<year>2006</year>). <article-title>Augustus at EGASP prediction of alternative transcripts.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>34</volume> <fpage>W435</fpage>&#x2013;<lpage>W439</lpage>. <pub-id pub-id-type="doi">10.1186/gb-2006-7-s1-s11</pub-id> <pub-id pub-id-type="pmid">16925833</pub-id></citation></ref>
<ref id="B53"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Stankova</surname> <given-names>H.</given-names></name> <name><surname>Hastie</surname> <given-names>A. R.</given-names></name> <name><surname>Chan</surname> <given-names>S.</given-names></name> <name><surname>Vr&#x00E1;na</surname> <given-names>J.</given-names></name> <name><surname>Tulpov&#x00E1;</surname> <given-names>Z.</given-names></name> <name><surname>Kubal&#x00E1;kov&#x00E1;</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>BioNano genome mapping of individual chromosomes supports physical mapping and sequence assembly in complex plant genomes.</article-title> <source><italic>Plant Biotech. J.</italic></source> <volume>14</volume> <fpage>1523</fpage>&#x2013;<lpage>1531</lpage>.</citation></ref>
<ref id="B54"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sunkar</surname> <given-names>R.</given-names></name> <name><surname>Chinnusamy</surname> <given-names>V.</given-names></name> <name><surname>Zhu</surname> <given-names>J.</given-names></name> <name><surname>Zhu</surname> <given-names>J. K.</given-names></name></person-group> (<year>2007</year>). <article-title>Small RNAs as big players in plant abiotic stress responses and nutrient deprivation.</article-title> <source><italic>Trends Plant Sci.</italic></source> <volume>12</volume> <fpage>301</fpage>&#x2013;<lpage>309</lpage>. <pub-id pub-id-type="doi">10.1016/j.tplants.2007.05.001</pub-id> <pub-id pub-id-type="pmid">17573231</pub-id></citation></ref>
<ref id="B55"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tarailo-Graovac</surname> <given-names>M.</given-names></name> <name><surname>Nansheng</surname> <given-names>C.</given-names></name></person-group> (<year>2009</year>). <article-title>Using RepeatMasker to identify repetitive elements in genomic sequences.</article-title> <source><italic>Curr. Protoc. Bioinform.</italic></source> <volume>25</volume> <fpage>4</fpage>&#x2013;<lpage>10</lpage>.</citation></ref>
<ref id="B56"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Treangen</surname> <given-names>T. J.</given-names></name> <name><surname>Salzberg</surname> <given-names>S. L.</given-names></name></person-group> (<year>2012</year>). <article-title>Repetitive DNA and next-generation sequencing: computational challenges and solutions.</article-title> <source><italic>Nat. Rev. Genet.</italic></source> <volume>13</volume> <fpage>36</fpage>&#x2013;<lpage>46</lpage>.</citation></ref>
<ref id="B57"><citation citation-type="journal"><collab>UniProt Consortium</collab> (<year>2014</year>). <article-title>UniProt: a hub for protein information.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>43</volume> <fpage>D204</fpage>&#x2013;<lpage>12</lpage>.</citation></ref>
<ref id="B58"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Van Nguyen</surname> <given-names>Ho</given-names></name> <name><surname>Dominique</surname> <given-names>L.</given-names></name></person-group> (<year>2009</year>). <article-title>PLAST: parallel local alignment search tool for database comparison.</article-title> <source><italic>BMC Bioinform.</italic></source> <volume>10</volume>:<issue>329</issue>. <pub-id pub-id-type="doi">10.1186/1471-2105-10-329</pub-id> <pub-id pub-id-type="pmid">19821978</pub-id></citation></ref>
<ref id="B59"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Vurture</surname> <given-names>G. W.</given-names></name> <name><surname>Sedlazeck</surname> <given-names>F. J.</given-names></name> <name><surname>Nattestad</surname> <given-names>M.</given-names></name> <name><surname>Underwood</surname> <given-names>C. J.</given-names></name> <name><surname>Han Fang Gurtowski</surname> <given-names>J.</given-names></name> <name><surname>Schatz</surname> <given-names>M. C.</given-names></name></person-group> (<year>2017</year>). <article-title>GenomeScope: fast reference-free genome profiling from short reads.</article-title> <source><italic>Bioinformatics</italic></source> <volume>33</volume> <fpage>2202</fpage>&#x2013;<lpage>2204</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btx153</pub-id> <pub-id pub-id-type="pmid">28369201</pub-id></citation></ref>
<ref id="B60"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Walker</surname> <given-names>B. J.</given-names></name> <name><surname>Abeel</surname> <given-names>T.</given-names></name> <name><surname>Shea</surname> <given-names>T.</given-names></name> <name><surname>Priest</surname> <given-names>M.</given-names></name> <name><surname>Abouelliel</surname> <given-names>A.</given-names></name> <name><surname>Sakthikumar</surname> <given-names>S.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>Pilon: an integrated tool for comprehensive microbial variant detection and genome assembly improvement.</article-title> <source><italic>PLoS One</italic></source> <volume>9</volume>:<issue>e112963</issue>.</citation></ref>
<ref id="B61"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>Y.</given-names></name> <name><surname>Coleman-Derr</surname> <given-names>D.</given-names></name> <name><surname>Chen</surname> <given-names>G.</given-names></name> <name><surname>Gu</surname> <given-names>Y. Q.</given-names></name></person-group> (<year>2015</year>). <article-title>OrthoVenn: a web server for genome wide comparison and annotation of orthologous clusters across multiple species.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>43</volume> <fpage>W78</fpage>&#x2013;<lpage>W84</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkv487</pub-id> <pub-id pub-id-type="pmid">25964301</pub-id></citation></ref>
<ref id="B62"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Xu</surname> <given-names>Z.</given-names></name> <name><surname>Wang</surname> <given-names>H.</given-names></name></person-group> (<year>2007</year>). <article-title>LTR FINDER: an efficient tool for the prediction of full-length LTR retrotransposons.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>35</volume> <fpage>W265</fpage>&#x2013;<lpage>W268</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkm286</pub-id> <pub-id pub-id-type="pmid">17485477</pub-id></citation></ref>
<ref id="B63"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yuan</surname> <given-names>J.</given-names></name> <name><surname>Levitin</surname> <given-names>H. M.</given-names></name> <name><surname>Frattini</surname> <given-names>V.</given-names></name> <name><surname>Bush</surname> <given-names>E. C.</given-names></name> <name><surname>Boyett</surname> <given-names>D. M.</given-names></name> <name><surname>Samanamud</surname> <given-names>J.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>Single-cell transcriptome analysis of lineage diversity in high-grade glioma.</article-title> <source><italic>Genome Med.</italic></source> <volume>10</volume>:<issue>57</issue>.</citation></ref>
<ref id="B64"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yuan</surname> <given-names>Z.</given-names></name> <name><surname>Fang</surname> <given-names>Y.</given-names></name> <name><surname>Zhang</surname> <given-names>T.</given-names></name> <name><surname>Fei</surname> <given-names>Z.</given-names></name> <name><surname>Han</surname> <given-names>F.</given-names></name> <name><surname>Liu</surname> <given-names>C.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>The pomegranate (<italic>Punica granatum</italic> L.) genome provides insights into fruit quality and ovule developmental biology.</article-title> <source><italic>Plant Biotech. J.</italic></source> <volume>16</volume> <fpage>1363</fpage>&#x2013;<lpage>1374</lpage>. <pub-id pub-id-type="doi">10.1111/pbi.12875</pub-id> <pub-id pub-id-type="pmid">29271050</pub-id></citation></ref>
<ref id="B65"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>L.</given-names></name> <name><surname>Hu</surname> <given-names>J.</given-names></name> <name><surname>Han</surname> <given-names>X.</given-names></name> <name><surname>Li</surname> <given-names>J.</given-names></name> <name><surname>Gao</surname> <given-names>Y.</given-names></name> <name><surname>Richards</surname> <given-names>C. M.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>A high-quality apple genome assembly reveals the association of a retrotransposon and red fruit colour.</article-title> <source><italic>Nat. Commun.</italic></source> <volume>10</volume>:<issue>1494</issue>. <pub-id pub-id-type="doi">10.1038/s41467-019-09518-x</pub-id> <pub-id pub-id-type="pmid">30940818</pub-id></citation></ref>
</ref-list>
</back>
</article>