<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Archiving and Interchange DTD v2.3 20070202//EN" "archivearticle.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="data-paper">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Mar. Sci.</journal-id>
<journal-title>Frontiers in Marine Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Mar. Sci.</abbrev-journal-title>
<issn pub-type="epub">2296-7745</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fmars.2020.00172</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Marine Science</subject>
<subj-group>
<subject>Data Report</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>A Novel Full-Length Transcriptome Resource for Black Tiger Shrimp (<italic>Penaeus monodon</italic>) Developed Using Isoform Sequencing (Iso-Seq)</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Pootakham</surname> <given-names>Wirulda</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn002"><sup>&#x02020;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/211002/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Uengwetwanit</surname> <given-names>Tanaporn</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="author-notes" rid="fn002"><sup>&#x02020;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/912732/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Sonthirod</surname> <given-names>Chutima</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Sittikankaew</surname> <given-names>Kanchana</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Karoonuthaisiri</surname> <given-names>Nitsara</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x0002A;</sup></xref>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>National Omics Center, National Center for Genetic Engineering and Biotechnology (BIOTEC), National Science and Technology Development Agency</institution>, <addr-line>Pathum Thani</addr-line>, <country>Thailand</country></aff>
<aff id="aff2"><sup>2</sup><institution>National Center for Genetic Engineering and Biotechnology (BIOTEC), National Science and Technology Development Agency</institution>, <addr-line>Pathum Thani</addr-line>, <country>Thailand</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Pei-Yuan Qian, Hong Kong University of Science and Technology, Hong Kong</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Ka Yan Ma, The Chinese University of Hong Kong, China; Marta Gomez-Chiarri, University of Rhode Island, United States; Adam Michael Reitzel, University of North Carolina at Charlotte, United States</p></fn>
<corresp id="c001">&#x0002A;Correspondence: Nitsara Karoonuthaisiri <email>nitsara&#x00040;alumni.stanford.edu</email></corresp>
<fn fn-type="other" id="fn001"><p>This article was submitted to Marine Molecular Biology and Ecology, a section of the journal Frontiers in Marine Science</p></fn>
<fn fn-type="other" id="fn002"><p>&#x02020;These authors have contributed equally to this work</p></fn></author-notes>
<pub-date pub-type="epub">
<day>24</day>
<month>03</month>
<year>2020</year>
</pub-date>
<pub-date pub-type="collection">
<year>2020</year>
</pub-date>
<volume>7</volume>
<elocation-id>172</elocation-id>
<history>
<date date-type="received">
<day>22</day>
<month>01</month>
<year>2020</year>
</date>
<date date-type="accepted">
<day>05</day>
<month>03</month>
<year>2020</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x000A9; 2020 Pootakham, Uengwetwanit, Sonthirod, Sittikankaew and Karoonuthaisiri.</copyright-statement>
<copyright-year>2020</copyright-year>
<copyright-holder>Pootakham, Uengwetwanit, Sonthirod, Sittikankaew and Karoonuthaisiri</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<kwd-group>
<kwd>black tiger shrimp</kwd>
<kwd><italic>Penaeus monodon</italic></kwd>
<kwd>transcriptome</kwd>
<kwd>Iso-seq</kwd>
<kwd>PacBio sequencing</kwd>
</kwd-group>
<contract-num rid="cn001">P-16-51718</contract-num>
<contract-num rid="cn001">P-18-51724</contract-num>
<contract-num rid="cn001">P-19-50419</contract-num>
<contract-num rid="cn002">734486</contract-num>
<contract-sponsor id="cn001">National Science and Technology Development Agency<named-content content-type="fundref-id">10.13039/501100004192</named-content></contract-sponsor>
<contract-sponsor id="cn002">H2020 Marie Sk&#x00142;odowska-Curie Actions<named-content content-type="fundref-id">10.13039/100010665</named-content></contract-sponsor>
<counts>
<fig-count count="1"/>
<table-count count="1"/>
<equation-count count="0"/>
<ref-count count="25"/>
<page-count count="5"/>
<word-count count="3099"/>
</counts>
</article-meta>
</front>
<body>
<sec id="s1">
<title>Background</title>
<p>The black tiger shrimp, <italic>Penaeus monodon</italic>, is one of the major cultured penaeid shrimp species, contributing 9% of total crustacean production (FAO, <xref ref-type="bibr" rid="B3">2018</xref>). With its economic and nutritional importance, extensive research and development programs have been initiated to gain better understanding of various biological processes in black tiger shrimp and to apply this basic knowledge to improve farming practices and advance selective breeding programs with an ultimate goal of sustainable shrimp farming industry. Although several transcriptome studies in shrimp have been performed using expressed sequence tags (ESTs) (Lehnert et al., <xref ref-type="bibr" rid="B10">1999</xref>; Supungul et al., <xref ref-type="bibr" rid="B15">2002</xref>; Tassanakajon et al., <xref ref-type="bibr" rid="B17">2006</xref>), microarray technology (Karoonuthaisiri et al., <xref ref-type="bibr" rid="B7">2009</xref>; Wongsurawat et al., <xref ref-type="bibr" rid="B22">2010</xref>; Leelatanawit et al., <xref ref-type="bibr" rid="B9">2011</xref>; Uawisetwathana et al., <xref ref-type="bibr" rid="B19">2011</xref>), and second-generation sequencing (SGS) technologies (Rotllant et al., <xref ref-type="bibr" rid="B13">2015</xref>; Nguyen et al., <xref ref-type="bibr" rid="B12">2016</xref>; Huerlimann et al., <xref ref-type="bibr" rid="B6">2018</xref>; Uengwetwanit et al., <xref ref-type="bibr" rid="B20">2018</xref>), the efforts were significantly impeded by the lack of high-quality reference genome assembly in this organism. It is also extremely challenging to obtain a complete, full-length transcriptome assembly from short-read RNA sequencing (RNAseq) data given the high contents of repetitive elements, which have been estimated to be 46.68&#x02013;51.18% (Huang et al., <xref ref-type="bibr" rid="B5">2011</xref>; Yuan et al., <xref ref-type="bibr" rid="B25">2018</xref>).</p>
<p>In this study, we applied long-read Pacific Biosciences (PacBio) isoform sequencing (Iso-seq) to generate the first full-length transcriptome assembly for black tiger shrimp. Full-length mRNA sequences from nine major organs and hemocytes were obtained using PacBio&#x00027;s circular consensus sequencing (CCS) technology. PacBio sequencing platform enables full-length transcripts from their 5&#x02032; ends to poly(A) tails to be captured in single long reads, making this an ideal approach for constructing a reference transcriptome assembly without reference genome sequences (Dong et al., <xref ref-type="bibr" rid="B1">2015</xref>; Kuo et al., <xref ref-type="bibr" rid="B8">2017</xref>; Workman et al., <xref ref-type="bibr" rid="B23">2018</xref>). The ability to capture full-length transcripts also facilitates the discovery of novel isoforms and alternative transcripts that vary with developmental stages (Thatcher et al., <xref ref-type="bibr" rid="B18">2016</xref>), cell types (Swarup et al., <xref ref-type="bibr" rid="B16">2016</xref>) and stress conditions (Yan et al., <xref ref-type="bibr" rid="B24">2012</xref>; Liu et al., <xref ref-type="bibr" rid="B11">2016</xref>). Without a high-quality genome sequence draft, we believe that this high-quality reference transcriptome assembly will be a valuable resource for transcriptome profiling studies under various conditions in black tiger shrimp.</p></sec>
<sec id="s2">
<title>Data Description</title>
<sec>
<title>Sample Collection</title>
<p>A total of nine organs and hemocytes were harvested from two male and two female 4-month-old juvenile black tiger shrimps (Yui Gung Oog, Prachuap Khiri Khan, Thailand). The shrimps were specific pathogen free: they were tested for White Spot Syndrome Virus (WSSV), Yellowhead disease, Taura Syndrome (TS) virus and acute hepatopancreatic necrosis disease (AHPND). All tissue samples (except ovary and testis) were pooled from four individuals while the ovary and testis tissues were pooled from two individuals. This study was performed in accordance with the recommendations of Animal Research Ethics Guidelines, and the protocol was approved by the National Center of Genetic Engineering and Biotechnology Animal Research Ethics Committee (approval number BT-IACUC-RF01-10-01). The following organs were dissected and immediately frozen in liquid nitrogen: gill, heart, hepatopancreas, intestine, ovary, pleopod, stomach, testis and thoracic ganglia. Haemolymph was centrifuged at 3,000 rpm at 4&#x000B0;C for 5 min to pellet the hemocytes, which were then frozen in liquid nitrogen. All samples were stored at &#x02212;80&#x000B0;C until RNA extraction.</p></sec>
<sec>
<title>RNA Extraction and PacBio Sequencing</title>
<p>Total RNA was extracted from the frozen tissues using TRI REAGENT according to the manufacturer&#x00027;s instruction (Molecular Research Center, USA). Contaminated genomic DNA was removed by DNase I treatment at 0.5 U/&#x003BC;g total RNA at 37&#x000B0;C for 30 min (Promega, USA). One ug of DNase-treated RNA sample from each tissue was used for cDNA synthesis. SMRTbell library construction was carried out using the SMRTbell Template Prep Kit 1.0-SPv3 protocol, following the manufacturer&#x00027;s instruction (Pacific Biosciences, Menlo Park, USA). Barcodes were used to keep track of the tissue origin of the samples. The libraries were run on the PacBio Sequel System using the sequencing chemistry version 3.0 and 10-h movie times (the sequencing was outsourced to NovogenAIT, Singapore and Macrogen, Korea).</p></sec>
<sec>
<title>Transcriptome Assembly and Annotation</title>
<p>SMRTlink version 6.0 (Pacific Biosciences, Menlo Park, CA, USA) was used to filter and process raw subreads, using the Iso-seq3 pipeline to obtain highly accurate long reads. Subreads shorter than 50 nt (default parameter) or with the ReadScore lower than 0.8 were removed prior to generating the circular consensus sequence (CCS) reads using the following parameters: minPasses = 1 and minPredictedAccuracy = 0.9. Full-length non-chimeric (FLNC) or non full-length (NFL) reads were classified based on the presence or absence of 5&#x02032; primer, 3&#x02032; primer and the poly(A) tail. FLNC reads were clustered using the Iso-seq3 cluster module in the SMRTlink to generate consensus sequences, which were subsequently polished with the Arrow software (<ext-link ext-link-type="uri" xlink:href="https://www.pacb.com/wp-content/uploads/SMRT_Tools_Reference_Guide_v600.pdf">https://www.pacb.com/wp-content/uploads/SMRT_Tools_Reference_Guide_v600.pdf</ext-link>) using NFL reads. We obtained a total of 1,604,098 reads of insert (from all tissues combined), ranging from 50 to 14,973 nt with an average read length of 2,942 and an N50 of 3,242 nt. Of those reads of insert, 82,441 were high-quality FLNC transcripts (<xref ref-type="table" rid="T1">Table 1</xref>). To exclude contaminating sequences from other organisms, we aligned FLNC transcripts to virus, bacteria, fungi and human sequences (from the NCBI RefSeq database release number 97) using BLASTN and identified 22 FLNC transcripts that exhibited over 90% identity to those sequences with at least 90% sequence coverage. Those were removed prior to downstream analyses. We subsequently used CPAT version 1.2.4 (Wang et al., <xref ref-type="bibr" rid="B21">2013</xref>) to filter out 5,627 long non-coding RNA (lncRNA) and clustered the remaining transcript sequences at 99% identity using UCLUST (Edgar, <xref ref-type="bibr" rid="B2">2010</xref>) to obtain a set of 22,418 non-redundant sequences in the final transcriptome assembly. Compared to our full-length transcriptome assembly, the previously reported assembly derived from Illumina short reads contained a greater number of transcripts (236,085 sequences; TRA: GGLH00000000) with considerably shorter average read length (956 nt) and N50 length (1,431 nt) (Huerlimann et al., <xref ref-type="bibr" rid="B6">2018</xref>).</p>
<table-wrap position="float" id="T1">
<label>Table 1</label>
<caption><p>Assembly statistics for <italic>P. monodon</italic> transcriptome.</p></caption>
<table frame="hsides" rules="groups">
<tbody>
<tr>
<td valign="top" align="left"><bold>PacBio Iso-seq</bold></td>
<td/>
</tr>
<tr>
<td valign="top" align="left">Number of bases sequenced (nt)</td>
<td valign="top" align="center">93,918,510,812</td>
</tr>
<tr>
<td valign="top" align="left">Number of reads of insert</td>
<td valign="top" align="center">1,640,098</td>
</tr>
<tr>
<td valign="top" align="left">Mean read of insert length (nt)</td>
<td valign="top" align="center">2,942</td>
</tr>
<tr>
<td valign="top" align="left">Median read of insert length (nt)</td>
<td valign="top" align="center">2,675</td>
</tr>
<tr>
<td valign="top" align="left">Read of insert N90 (nt)</td>
<td valign="top" align="center">1,897</td>
</tr>
<tr>
<td valign="top" align="left">Read of insert N50 (nt)</td>
<td valign="top" align="center">3,242</td>
</tr>
<tr>
<td valign="top" align="left">Read of insert N20 (nt)</td>
<td valign="top" align="center">4,938</td>
</tr>
<tr>
<td valign="top" align="left">Maximum read of insert length (nt)</td>
<td valign="top" align="center">14,973</td>
</tr>
<tr>
<td valign="top" align="left">Number of filtered high-quality FLNC reads</td>
<td valign="top" align="center">82,419</td>
</tr>
<tr>
<td valign="top" align="left">Mean GC content</td>
<td valign="top" align="center">43.92</td>
</tr>
<tr>
<td valign="top" align="left">Total assembled bases (nt)</td>
<td valign="top" align="center">4,826,359,993</td>
</tr>
<tr>
<td valign="top" align="left"><bold>Transcriptome annotation</bold></td>
<td/>
</tr>
<tr>
<td valign="top" align="left">% of transcripts annotated</td>
<td valign="top" align="center">94.12</td>
</tr>
<tr>
<td valign="top" align="left">% of transcripts with GO annotations</td>
<td valign="top" align="center">53.22</td>
</tr>
<tr>
<td valign="top" align="left">% of transcripts with KOG annotations</td>
<td valign="top" align="center">83.15</td>
</tr>
<tr>
<td valign="top" align="left"><bold>BUSCO</bold></td>
<td/>
</tr>
<tr>
<td valign="top" align="left">% complete</td>
<td valign="top" align="center">80.86</td>
</tr>
<tr>
<td valign="top" align="left">% partial</td>
<td valign="top" align="center">2.64</td>
</tr>
<tr>
<td valign="top" align="left">% missing</td>
<td valign="top" align="center">16.5</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The annotations of this reference assembly, including gene ontology (GO) and eukaryotic orthologous groups (KOG) assignments, were carried out using Blast2GO version 5.2 (G&#x000F6;tz et al., <xref ref-type="bibr" rid="B4">2008</xref>) (BioBam, Valencia, Spain; <xref ref-type="supplementary-material" rid="SM1">Supplementary Table 1</xref>). Approximately 94% of sequences in the assembly were annotated, and 53% and 83% had been assigned GO and KOG annotations, respectively (<xref ref-type="table" rid="T1">Table 1</xref>). The highest number of transcripts sequenced was affiliated with cellular metabolic process, organic substance metabolic process, primary metabolic process and nitrogen compound metabolic process (<xref ref-type="fig" rid="F1">Figure 1A</xref>). We also investigated the completeness of the transcriptome assembly by assessing the coverage of the benchmarking universal single-copy orthologs (BUSCO) using the eukaryotic gene set (Sim&#x000E3;o et al., <xref ref-type="bibr" rid="B14">2015</xref>). Of the 429 conserved eukaryotic genes, 80.86% were identified as &#x0201C;complete&#x0201D; in the assembly and an additional 2.64% were partially assembled. Our assembly had a much higher proportion of &#x0201C;missing&#x0201D; orthologs (16.5%) compared to the assembly reported by Huerlimann et al. (<xref ref-type="bibr" rid="B6">2018</xref>), which was 98% complete based on BUSCO analysis. The fact that our shrimp samples were from a single stage (4-month old) while those used in Huerlimann et al. (<xref ref-type="bibr" rid="B6">2018</xref>) were from multiple stages and that some of the tissues sequenced in Huerlimann et al. (<xref ref-type="bibr" rid="B6">2018</xref>) were not included in our study could attribute to the missing orthologs in the BUSCO assessment. Most of the conserved orthologs that were missing in our assembly were those involved in the DNA replication processes.</p>
<fig id="F1" position="float">
<label>Figure 1</label>
<caption><p>Gene annotation and transcript distribution. <bold>(A)</bold> Distribution of functional categories based on GO terms in <italic>P. monodon</italic> transcriptome assembly. <bold>(B)</bold> Distribution of transcripts in each tissue type based on their presence in the tissues studied. Tissue-specific transcripts (orange bar) are present in only one tissue type; ubiquitous transcripts (blue bar) are present in all tissue types, and common transcripts (green bar) are present in more than one tissue type but not detected in all tissues examined. The number represents the percentage of each transcript category in each tissue type.</p></caption>
<graphic xlink:href="fmars-07-00172-g0001.tif"/>
</fig>
<p>RNA samples from nine different tissue types and hemocytes were sequenced to generate the reference transcriptome assembly. We kept track of the origin of individual full-length transcript sequence and classified each of them as follows: &#x0201C;tissue-specific&#x0201D; when it is present in only one tissue type, &#x0201C;ubiquitous&#x0201D; when it is present in all tissue types investigated and &#x0201C;common&#x0201D; when it is present in between two to nine tissue types studied. Of the 22,418 non-redundant transcript sequences in the assembly, 462 transcripts were present in all tissues examined (<xref ref-type="supplementary-material" rid="SM1">Supplementary Table 2</xref>). The number of non-redundant transcripts detected in each tissue type is displayed in <xref ref-type="fig" rid="F1">Figure 1B</xref> and <xref ref-type="supplementary-material" rid="SM1">Supplementary Table 2</xref>. Hepatopancreas (26.7%) and testis (26.0%) tissues had the highest proportions of tissue-specific transcripts while heart tissues had the lowest proportion of tissue-specific transcripts (11.1%; <xref ref-type="fig" rid="F1">Figure 1B</xref> and <xref ref-type="supplementary-material" rid="SM1">Supplementary Table 2</xref>). Interestingly, between 54 and 65% of the transcripts detected in each individual tissue type were also present in the stomach. On contrary, only 17-30% of the transcripts detected in each individual tissue type were also present in either hepatopancreas or ovary tissues (<xref ref-type="supplementary-material" rid="SM1">Supplementary Table 2</xref>).</p>
<p>The ability to capture full-length transcripts using Iso-seq technology provided a unique opportunity to detect alternative splicing events in different tissue types. To identify candidate transcripts with multiple isoforms, we examined clusters of FLNC transcripts containing sequences of multiple lengths. Examples of transcripts with different isoforms are shown in <xref ref-type="supplementary-material" rid="SM2">Supplementary Figure 1</xref>. A transcript annotated as T-cell immunomodulatory protein had two alternative 5&#x02032; splice sites and displayed a hemocyte-specific isoform with a truncated 3&#x02032; end, which likely represented an exon-skipping event. Another example was the thoracic ganglia-specific isoform (annotated as protein lines-like) appeared to skip an exon near the 5&#x02032; end of the transcript. Complementary information from genome sequences is required to map the exon-intron junctions and determine if the alternative splicing events observed are exon skipping or intron retention. PacBio technology eliminates the need to assemble transcripts from short-read data and allows (long) full-length transcripts to be sequenced in single-molecule reads, providing direct evidence for alternatively spliced isoforms.</p></sec>
<sec>
<title>Re-use Potential</title>
<p>This study reports the first full-length transcriptome assembly for <italic>P. mondon</italic>, utilizing PacBio long-read single molecule real-time (SMRT) sequencing technology to obtain full-length transcript sequences. Future transcriptome profiling studies and genome sequencing projects in <italic>P. monodon</italic> and closely related species will greatly benefit from the full-length Iso-seq based transcriptome assembly reported here and the previously reported Illumina-based transcriptome assembly.</p></sec></sec>
<sec sec-type="data-availability-statement" id="s3">
<title>Data Availability Statement</title>
<p>The transcriptome assembly is available from NCBI GenBank database under BioProject ID PRJNA602748, and the transcriptome annotations are provided in <xref ref-type="supplementary-material" rid="SM1">Supplementary Table 1</xref>.</p></sec>
<sec id="s4">
<title>Author Contributions</title>
<p>NK, TU, and WP conceived and designed the experiment. KS collected shrimp samples and carried out the RNA extraction. CS and TU performed bioinformatics analyses. WP and NK wrote the manuscript. All authors read and approved the final manuscript.</p>
<sec>
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p></sec>
</sec>
</body>
<back>
<sec sec-type="supplementary-material" id="s5">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fmars.2020.00172/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fmars.2020.00172/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Table_1.XLSX" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image_1.JPEG" id="SM2" mimetype="image/jpeg" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dong</surname> <given-names>L.</given-names></name> <name><surname>Liu</surname> <given-names>H.</given-names></name> <name><surname>Zhang</surname> <given-names>J.</given-names></name> <name><surname>Yang</surname> <given-names>S.</given-names></name> <name><surname>Kong</surname> <given-names>G.</given-names></name> <name><surname>Chu</surname> <given-names>J. S. C.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>Single-molecule real-time transcript sequencing facilitates common wheat genome annotation and grain transcriptome research</article-title>. <source>BMC Genomics</source> <volume>16</volume>:<fpage>1039</fpage>. <pub-id pub-id-type="doi">10.1186/s12864-015-2257-y</pub-id><pub-id pub-id-type="pmid">26645802</pub-id></citation></ref>
<ref id="B2">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Edgar</surname> <given-names>R. C.</given-names></name></person-group> (<year>2010</year>). <article-title>Search and clustering orders of magnitude faster than BLAST</article-title>. <source>Bioinformatics</source> <volume>26</volume>, <fpage>2460</fpage>&#x02013;<lpage>2461</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btq461</pub-id><pub-id pub-id-type="pmid">20709691</pub-id></citation></ref>
<ref id="B3">
<citation citation-type="book"><person-group person-group-type="author"><collab>FAO</collab></person-group> (<year>2018</year>). <source>The State of Fisheries and Aquaqulture 2018. Meeting the Sustainable Development Goals</source>. <publisher-loc>Rome</publisher-loc>: <publisher-name>FAO</publisher-name>.</citation></ref>
<ref id="B4">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>G&#x000F6;tz</surname> <given-names>S.</given-names></name> <name><surname>Garc&#x000ED;a-G&#x000F3;mez</surname> <given-names>J. M.</given-names></name> <name><surname>Terol</surname> <given-names>J.</given-names></name> <name><surname>Williams</surname> <given-names>T. D.</given-names></name> <name><surname>Nagaraj</surname> <given-names>S. H.</given-names></name> <name><surname>Nueda</surname> <given-names>M. J.</given-names></name> <etal/></person-group>. (<year>2008</year>). <article-title>High-throughput functional annotation and data mining with the Blast2GO suite</article-title>. <source>Nucleic Acids Res.</source> <volume>36</volume>, <fpage>3420</fpage>&#x02013;<lpage>3435</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkn176</pub-id><pub-id pub-id-type="pmid">18445632</pub-id></citation></ref>
<ref id="B5">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Huang</surname> <given-names>S.-W.</given-names></name> <name><surname>Lin</surname> <given-names>Y.-Y.</given-names></name> <name><surname>You</surname> <given-names>E.-M.</given-names></name> <name><surname>Liu</surname> <given-names>T.-T.</given-names></name> <name><surname>Shu</surname> <given-names>H.-Y.</given-names></name> <name><surname>Wu</surname> <given-names>K.-M.</given-names></name> <etal/></person-group>. (<year>2011</year>). <article-title>Fosmid library end sequencing reveals a rarely known genome structure of marine shrimp <italic>Penaeus monodon</italic></article-title>. <source>BMC Genomics</source> <volume>12</volume>:<fpage>242</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2164-12-242</pub-id><pub-id pub-id-type="pmid">21575266</pub-id></citation></ref>
<ref id="B6">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Huerlimann</surname> <given-names>R.</given-names></name> <name><surname>Wade</surname> <given-names>N. M.</given-names></name> <name><surname>Gordon</surname> <given-names>L.</given-names></name> <name><surname>Montenegro</surname> <given-names>J. D.</given-names></name> <name><surname>Goodall</surname> <given-names>J.</given-names></name> <name><surname>Mcwilliam</surname> <given-names>S.</given-names></name> <etal/></person-group>. (<year>2018</year>). <article-title>De novo assembly, characterization, functional annotation and expression patterns of the black tiger shrimp (<italic>Penaeus monodon</italic>) transcriptome</article-title>. <source>Sci. Rep.</source> <volume>8</volume>:<fpage>13553</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-018-31148-4</pub-id><pub-id pub-id-type="pmid">30202061</pub-id></citation></ref>
<ref id="B7">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Karoonuthaisiri</surname> <given-names>N.</given-names></name> <name><surname>Sittikankeaw</surname> <given-names>K.</given-names></name> <name><surname>Preechaphol</surname> <given-names>R.</given-names></name> <name><surname>Kalachikov</surname> <given-names>S.</given-names></name> <name><surname>Wongsurawat</surname> <given-names>T.</given-names></name> <name><surname>Uawisetwathana</surname> <given-names>U.</given-names></name> <etal/></person-group>. (<year>2009</year>). <article-title>ReproArray(GTS): a cDNA microarray for identification of reproduction-related genes in the giant tiger shrimp Penaeus monodon and characterization of a novel nuclear autoantigenic sperm protein (NASP) gene</article-title>. <source>Comp. Biochem. Physiol. Part D Genomics Proteomics</source> <volume>4</volume>, <fpage>90</fpage>&#x02013;<lpage>99</lpage>. <pub-id pub-id-type="doi">10.1016/j.cbd.2008.11.003</pub-id><pub-id pub-id-type="pmid">20403739</pub-id></citation></ref>
<ref id="B8">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kuo</surname> <given-names>R. I.</given-names></name> <name><surname>Tseng</surname> <given-names>E.</given-names></name> <name><surname>Eory</surname> <given-names>L.</given-names></name> <name><surname>Paton</surname> <given-names>I. R.</given-names></name> <name><surname>Archibald</surname> <given-names>A. L.</given-names></name> <name><surname>Burt</surname> <given-names>D. W.</given-names></name></person-group> (<year>2017</year>). <article-title>Normalized long read RNA sequencing in chicken reveals transcriptome complexity similar to human</article-title>. <source>BMC Genomics</source> <volume>18</volume>:<fpage>323</fpage>. <pub-id pub-id-type="doi">10.1186/s12864-017-3691-9</pub-id><pub-id pub-id-type="pmid">28438136</pub-id></citation></ref>
<ref id="B9">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Leelatanawit</surname> <given-names>R.</given-names></name> <name><surname>Uawisetwathana</surname> <given-names>U.</given-names></name> <name><surname>Klinbunga</surname> <given-names>S.</given-names></name> <name><surname>Karoonuthaisiri</surname> <given-names>N.</given-names></name></person-group> (<year>2011</year>). <article-title>A cDNA microarray, UniShrimpChip, for identification of genes relevant to testicular development in the black tiger shrimp (<italic>Penaeus monodon</italic>)</article-title>. <source>BMC Mol. Biol</source>. <volume>12</volume>:<fpage>15</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2199-12-15</pub-id><pub-id pub-id-type="pmid">21486443</pub-id></citation></ref>
<ref id="B10">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lehnert</surname> <given-names>S. A.</given-names></name> <name><surname>Wilson</surname> <given-names>K. J.</given-names></name> <name><surname>Byrne</surname> <given-names>K.</given-names></name> <name><surname>Moore</surname> <given-names>S. S.</given-names></name></person-group> (<year>1999</year>). <article-title>Tissue-specific expressed sequence tags from the black tiger shrimp <italic>Penaeus monodon</italic></article-title>. <source>Mar. Biotechnol.</source> <volume>1</volume>, <fpage>465</fpage>&#x02013;<lpage>0476</lpage>. <pub-id pub-id-type="doi">10.1007/PL00011803</pub-id><pub-id pub-id-type="pmid">10525681</pub-id></citation></ref>
<ref id="B11">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname> <given-names>J.</given-names></name> <name><surname>Chen</surname> <given-names>X.</given-names></name> <name><surname>Liang</surname> <given-names>X.</given-names></name> <name><surname>Zhou</surname> <given-names>X.</given-names></name> <name><surname>Yang</surname> <given-names>F.</given-names></name> <name><surname>Liu</surname> <given-names>J.</given-names></name> <etal/></person-group>. (<year>2016</year>). <article-title>Alternative splicing of rice WRKY62 and WRKY76 transcription factor genes in pathogen defense</article-title>. <source>Plant Physiol.</source> <volume>171</volume>, <fpage>1427</fpage>&#x02013;<lpage>1442</lpage>. <pub-id pub-id-type="doi">10.1104/pp.15.01921</pub-id><pub-id pub-id-type="pmid">27208272</pub-id></citation></ref>
<ref id="B12">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nguyen</surname> <given-names>C.</given-names></name> <name><surname>Nguyen</surname> <given-names>T. G.</given-names></name> <name><surname>Nguyen</surname> <given-names>L. V.</given-names></name> <name><surname>Pham</surname> <given-names>H. Q.</given-names></name> <name><surname>Nguyen</surname> <given-names>T. H.</given-names></name> <name><surname>Pham</surname> <given-names>H. T.</given-names></name> <etal/></person-group>. (<year>2016</year>). <article-title>De novo assembly and transcriptome characterization of major growth-related genes in various tissues of <italic>Penaeus monodon</italic></article-title>. <source>Aquaculture</source> <volume>464</volume>, <fpage>545</fpage>&#x02013;<lpage>553</lpage>. <pub-id pub-id-type="doi">10.1016/j.aquaculture.2016.08.003</pub-id></citation></ref>
<ref id="B13">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rotllant</surname> <given-names>G.</given-names></name> <name><surname>Wade</surname> <given-names>N. M.</given-names></name> <name><surname>Arnold</surname> <given-names>S. J.</given-names></name> <name><surname>Coman</surname> <given-names>G. J.</given-names></name> <name><surname>Preston</surname> <given-names>N. P.</given-names></name> <name><surname>Glencross</surname> <given-names>B. D.</given-names></name></person-group> (<year>2015</year>). <article-title>Identification of genes involved in reproduction and lipid pathway metabolism in wild and domesticated shrimps</article-title>. <source>Mar. Genomics</source> <volume>22</volume>, <fpage>55</fpage>&#x02013;<lpage>61</lpage>. <pub-id pub-id-type="doi">10.1016/j.margen.2015.04.001</pub-id><pub-id pub-id-type="pmid">25890100</pub-id></citation></ref>
<ref id="B14">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sim&#x000E3;o</surname> <given-names>F. A.</given-names></name> <name><surname>Waterhouse</surname> <given-names>R. M.</given-names></name> <name><surname>Ioannidis</surname> <given-names>P.</given-names></name> <name><surname>Kriventseva</surname> <given-names>E. V.</given-names></name> <name><surname>Zdobnov</surname> <given-names>E. M.</given-names></name></person-group> (<year>2015</year>). <article-title>BUSCO: assessing genome assembly and annotation completeness with single-copy orthologs</article-title>. <source>Bioinformatics</source> <volume>31</volume>, <fpage>3210</fpage>&#x02013;<lpage>3212</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btv351</pub-id><pub-id pub-id-type="pmid">26059717</pub-id></citation></ref>
<ref id="B15">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Supungul</surname> <given-names>P.</given-names></name> <name><surname>Klinbunga</surname> <given-names>S.</given-names></name> <name><surname>Pichyangkura</surname> <given-names>R.</given-names></name> <name><surname>Jitrapakdee</surname> <given-names>S.</given-names></name> <name><surname>Hirono</surname> <given-names>I.</given-names></name> <name><surname>Aoki</surname> <given-names>T.</given-names></name> <etal/></person-group>. (<year>2002</year>). <article-title>Identification of immune-related genes in hemocytes of black tiger shrimp (<italic>Penaeus monodon</italic>)</article-title>. <source>Mar. Biotechnol.</source> <volume>4</volume>, <fpage>487</fpage>&#x02013;<lpage>494</lpage>. <pub-id pub-id-type="doi">10.1007/s10126-002-0043-8</pub-id><pub-id pub-id-type="pmid">14961242</pub-id></citation></ref>
<ref id="B16">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Swarup</surname> <given-names>R.</given-names></name> <name><surname>Crespi</surname> <given-names>M.</given-names></name> <name><surname>Bennett</surname> <given-names>M. J.</given-names></name></person-group> (<year>2016</year>). <article-title>One gene, many proteins: mapping cell-specific alternative splicing in plants</article-title>. <source>Dev. Cell</source> <volume>39</volume>, <fpage>383</fpage>&#x02013;<lpage>385</lpage>. <pub-id pub-id-type="doi">10.1016/j.devcel.2016.11.002</pub-id><pub-id pub-id-type="pmid">27875679</pub-id></citation></ref>
<ref id="B17">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tassanakajon</surname> <given-names>A.</given-names></name> <name><surname>Klinbunga</surname> <given-names>S.</given-names></name> <name><surname>Paunglarp</surname> <given-names>N.</given-names></name> <name><surname>Rimphanitchayakit</surname> <given-names>V.</given-names></name> <name><surname>Udomkit</surname> <given-names>A.</given-names></name> <name><surname>Jitrapakdee</surname> <given-names>S.</given-names></name> <etal/></person-group>. (<year>2006</year>). <article-title>Penaeus monodon gene discovery project: the generation of an EST collection and establishment of a database</article-title>. <source>Gene</source> <volume>384</volume>, <fpage>104</fpage>&#x02013;<lpage>112</lpage>. <pub-id pub-id-type="doi">10.1016/j.gene.2006.07.012</pub-id><pub-id pub-id-type="pmid">16945489</pub-id></citation></ref>
<ref id="B18">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Thatcher</surname> <given-names>S. R.</given-names></name> <name><surname>Danilevskaya</surname> <given-names>O. N.</given-names></name> <name><surname>Meng</surname> <given-names>X.</given-names></name> <name><surname>Beatty</surname> <given-names>M.</given-names></name> <name><surname>Zastrow-Hayes</surname> <given-names>G.</given-names></name> <name><surname>Harris</surname> <given-names>C.</given-names></name> <etal/></person-group>. (<year>2016</year>). <article-title>Genome-wide analysis of alternative splicing during development and drought stress in maize</article-title>. <source>Plant Physiol.</source> <volume>170</volume>, <fpage>586</fpage>&#x02013;<lpage>599</lpage>. <pub-id pub-id-type="doi">10.1104/pp.15.01267</pub-id><pub-id pub-id-type="pmid">26582726</pub-id></citation></ref>
<ref id="B19">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Uawisetwathana</surname> <given-names>U.</given-names></name> <name><surname>Leelatanawit</surname> <given-names>R.</given-names></name> <name><surname>Klanchui</surname> <given-names>A.</given-names></name> <name><surname>Prommoon</surname> <given-names>J.</given-names></name> <name><surname>Klinbunga</surname> <given-names>S.</given-names></name> <name><surname>Karoonuthaisiri</surname> <given-names>N.</given-names></name></person-group> (<year>2011</year>). <article-title>Insights into eyestalk ablation mechanism to induce ovarian maturation in the black tiger shrimp</article-title>. <source>PLoS ONE</source> <volume>6</volume>:<fpage>e24427</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0024427</pub-id><pub-id pub-id-type="pmid">21915325</pub-id></citation></ref>
<ref id="B20">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Uengwetwanit</surname> <given-names>T.</given-names></name> <name><surname>Ponza</surname> <given-names>P.</given-names></name> <name><surname>Sangsrakru</surname> <given-names>D.</given-names></name> <name><surname>Wichadakul</surname> <given-names>D.</given-names></name> <name><surname>Ingsriswang</surname> <given-names>S.</given-names></name> <name><surname>Leelatanawit</surname> <given-names>R.</given-names></name> <etal/></person-group>. (<year>2018</year>). <article-title>Transcriptome-based discovery of pathways and genes related to reproduction of the black tiger shrimp (<italic>Penaeus monodon</italic>)</article-title>. <source>Mar. Genomics</source> <volume>37</volume>, <fpage>69</fpage>&#x02013;<lpage>73</lpage>. <pub-id pub-id-type="doi">10.1016/j.margen.2017.08.007</pub-id><pub-id pub-id-type="pmid">28899645</pub-id></citation></ref>
<ref id="B21">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>L.</given-names></name> <name><surname>Park</surname> <given-names>H. J.</given-names></name> <name><surname>Dasari</surname> <given-names>S.</given-names></name> <name><surname>Wang</surname> <given-names>S.</given-names></name> <name><surname>Kocher</surname> <given-names>J. P.</given-names></name> <name><surname>Li</surname> <given-names>W.</given-names></name></person-group> (<year>2013</year>). <article-title>CPAT: Coding-Potential Assessment Tool using an alignment-free logistic regression model</article-title>. <source>Nucleic Acids Res.</source> <volume>41</volume>:<fpage>e74</fpage>. <pub-id pub-id-type="doi">10.1093/nar/gkt006</pub-id><pub-id pub-id-type="pmid">23335781</pub-id></citation></ref>
<ref id="B22">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wongsurawat</surname> <given-names>T.</given-names></name> <name><surname>Leelatanawit</surname> <given-names>R.</given-names></name> <name><surname>Thamniemdee</surname> <given-names>N.</given-names></name> <name><surname>Uawisetwathana</surname> <given-names>U.</given-names></name> <name><surname>Karoonuthaisiri</surname> <given-names>N.</given-names></name> <name><surname>Menasveta</surname> <given-names>P.</given-names></name> <etal/></person-group>. (<year>2010</year>). <article-title>Identification of testis-relevant genes using <italic>in silico</italic> analysis from testis ESTs and cDNA microarray in the black tiger shrimp (<italic>Penaeus monodon</italic>)</article-title>. <source>BMC Mol. Biol</source>. <volume>11</volume>:<fpage>55</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2199-11-55</pub-id><pub-id pub-id-type="pmid">20696033</pub-id></citation></ref>
<ref id="B23">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Workman</surname> <given-names>R. E.</given-names></name> <name><surname>Myrka</surname> <given-names>A. M.</given-names></name> <name><surname>Wong</surname> <given-names>G. W.</given-names></name> <name><surname>Tseng</surname> <given-names>E.</given-names></name> <name><surname>Welch</surname> <given-names>K. C.</given-names> <suffix>Jr.</suffix></name> <name><surname>Timp</surname> <given-names>W.</given-names></name></person-group> (<year>2018</year>). <article-title>Single-molecule, full-length transcript sequencing provides insight into the extreme metabolism of the ruby-throated hummingbird <italic>Archilochus colubris</italic></article-title>. <source>GigaScience</source> <volume>7</volume>:<fpage>giy009</fpage>. <pub-id pub-id-type="doi">10.1093/gigascience/giy009</pub-id><pub-id pub-id-type="pmid">29618047</pub-id></citation></ref>
<ref id="B24">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yan</surname> <given-names>K.</given-names></name> <name><surname>Liu</surname> <given-names>P.</given-names></name> <name><surname>Wu</surname> <given-names>C.-A.</given-names></name> <name><surname>Yang</surname> <given-names>G.-D.</given-names></name> <name><surname>Xu</surname> <given-names>R.</given-names></name> <name><surname>Guo</surname> <given-names>Q.-H.</given-names></name> <etal/></person-group>. (<year>2012</year>). <article-title>Stress-induced alternative splicing provides a mechanism for the regulation of microRNA processing in <italic>Arabidopsis thaliana</italic></article-title>. <source>Mol. Cell</source> <volume>48</volume>, <fpage>521</fpage>&#x02013;<lpage>531</lpage>. <pub-id pub-id-type="doi">10.1016/j.molcel.2012.08.032</pub-id><pub-id pub-id-type="pmid">23063528</pub-id></citation></ref>
<ref id="B25">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yuan</surname> <given-names>J.</given-names></name> <name><surname>Zhang</surname> <given-names>X.</given-names></name> <name><surname>Liu</surname> <given-names>C.</given-names></name> <name><surname>Yu</surname> <given-names>Y.</given-names></name> <name><surname>Wei</surname> <given-names>J.</given-names></name> <name><surname>Li</surname> <given-names>F.</given-names></name> <etal/></person-group>. (<year>2018</year>). <article-title>Genomic resources and comparative analyses of two economical penaeid shrimp species, <italic>Marsupenaeus japonicus</italic> and <italic>Penaeus monodon</italic></article-title>. <source>Mar. Genomics</source> <volume>39</volume>, <fpage>22</fpage>&#x02013;<lpage>25</lpage>. <pub-id pub-id-type="doi">10.1016/j.margen.2017.12.006</pub-id></citation></ref>
</ref-list>
<fn-group>
<fn fn-type="financial-disclosure"><p><bold>Funding.</bold> This work was supported by the National Center for Genetic Engineering and Biotechnology (RI grant number P1851724 and Platform grant number P1651718), National Science and Technology Development Agency (grant number P1950419), and partially supported by the European Union&#x00027;s Horizon 2020 research and innovation program under the Marie Sk&#x00142;odowska-Curie grant agreement no. 734486.</p>
</fn>
</fn-group>
</back>
</article>