<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Archiving and Interchange DTD v2.3 20070202//EN" "archivearticle.dtd">
<article xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="data-paper">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Genet.</journal-id>
<journal-title>Frontiers in Genetics</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Genet.</abbrev-journal-title>
<issn pub-type="epub">1664-8021</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fgene.2021.739781</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Genetics</subject>
<subj-group>
<subject>Data Report</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Chromosome-Scale Genome Assembly and Transcriptome Assembly of Kawakawa <italic>Euthynnus affinis</italic>; A Tuna-Like Species</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name><surname>Havelka</surname> <given-names>Milo&#x00161;</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x0002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1401651/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Sawayama</surname> <given-names>Eitaro</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1433716/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Saito</surname> <given-names>Taiju</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Yoshitake</surname> <given-names>Kazutoshi</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Saka</surname> <given-names>Daiki</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Ineno</surname> <given-names>Toshinao</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1443907/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Asakawa</surname> <given-names>Shuichi</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1448114/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Takagi</surname> <given-names>Motohiro</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Goto</surname> <given-names>Rie</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Matsubara</surname> <given-names>Takahiro</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>South Ehime Fisheries Research Center, Ehime University</institution>, <addr-line>Ainan</addr-line>, <country>Japan</country></aff>
<aff id="aff2"><sup>2</sup><institution>Department of Marine Science and Resources, College of Bioresource Sciences, Nihon University</institution>, <addr-line>Fujisawa</addr-line>, <country>Japan</country></aff>
<aff id="aff3"><sup>3</sup><institution>Laboratory of Aquatic Molecular Biology and Biotechnology, Graduate School of Agricultural and Life Sciences, The University of Tokyo</institution>, <addr-line>Tokyo</addr-line>, <country>Japan</country></aff>
<aff id="aff4"><sup>4</sup><institution>Aquaculture Research Institute, Kindai University</institution>, <addr-line>Shingu</addr-line>, <country>Japan</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Joanna Szyda, Wroclaw University of Environmental and Life Sciences, Poland</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Xinhai Ye, Zhejiang University, China; Changxu Tian, Guangdong Ocean University, China</p></fn>
<corresp id="c001">&#x0002A;Correspondence: Milo&#x00161; Havelka <email>miloshavelka&#x00040;seznam.cz</email></corresp>
<fn fn-type="other" id="fn001"><p>This article was submitted to Livestock Genomics, a section of the journal Frontiers in Genetics</p></fn></author-notes>
<pub-date pub-type="epub">
<day>20</day>
<month>09</month>
<year>2021</year>
</pub-date>
<pub-date pub-type="collection">
<year>2021</year>
</pub-date>
<volume>12</volume>
<elocation-id>739781</elocation-id>
<history>
<date date-type="received">
<day>12</day>
<month>07</month>
<year>2021</year>
</date>
<date date-type="accepted">
<day>16</day>
<month>08</month>
<year>2021</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x000A9; 2021 Havelka, Sawayama, Saito, Yoshitake, Saka, Ineno, Asakawa, Takagi, Goto and Matsubara.</copyright-statement>
<copyright-year>2021</copyright-year>
<copyright-holder>Havelka, Sawayama, Saito, Yoshitake, Saka, Ineno, Asakawa, Takagi, Goto and Matsubara</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license></permissions>  
<kwd-group>
<kwd>aquaculture</kwd>
<kwd>comparative genomics</kwd>
<kwd>eastern little tuna</kwd>
<kwd>genome annotation</kwd>
<kwd>linkage map</kwd>
<kwd>Thunnini</kwd>
</kwd-group>
<contract-sponsor id="cn001">Ministry of Education, Culture, Sports, Science and Technology<named-content content-type="fundref-id">10.13039/501100001700</named-content></contract-sponsor>
<contract-sponsor id="cn002">National Agriculture and Food Research Organization<named-content content-type="fundref-id">10.13039/501100007172</named-content></contract-sponsor>
<counts>
<fig-count count="1"/>
<table-count count="1"/>
<equation-count count="0"/>
<ref-count count="75"/>
<page-count count="9"/>
<word-count count="7375"/>
</counts>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1">
<title>Introduction</title>
<p>Kawakawa <italic>Euthynnus affinis</italic>, also known as eastern little tuna or mackerel tuna, is a species of tuna (Thunnini tribe, subgroup Pelagiaria clade) (Sanciangco et al., <xref ref-type="bibr" rid="B54">2016</xref>). Tuna includes 15 species: eight of genus <italic>Thunnus</italic> (true tuna) and seven &#x0201C;tuna-like&#x0201D; of four genera: <italic>Allothunnus, Auxis, Euthynnus</italic>, and <italic>Katsuwonus</italic>.</p>
<p><italic>E. affinis</italic> is widely distributed throughout the tropical and subtropical waters of the continental shelf areas of the Indo-Pacific region (Collette, <xref ref-type="bibr" rid="B12">2001</xref>). The fish reaches a length of 45&#x02013;60 cm and matures at approximately 3 years of age. It inhabits almost exclusively the upper layers of the ocean (Bernal et al., <xref ref-type="bibr" rid="B4">2017</xref>) and feeds mainly on small pelagic fish (Griffiths et al., <xref ref-type="bibr" rid="B26">2009</xref>). <italic>E. affinis</italic> makes up a substantial proportion of the commercial and artisanal fishery in many countries of the Indo-Pacific region. The meat of <italic>E. affinis</italic> is of high quality (Mukundan et al., <xref ref-type="bibr" rid="B47">1979</xref>) with a comparatively high level of docosahexaenoic acid (Saito et al., <xref ref-type="bibr" rid="B53">1999</xref>), but deteriorates rapidly if not properly handled (Mukundan et al., <xref ref-type="bibr" rid="B47">1979</xref>). <italic>E. affinis</italic> exhibits the swimming mechanics of true tunas (Donley and Dickson, <xref ref-type="bibr" rid="B19">2000</xref>) but has no swim bladder and differs from true tunas in red muscle distribution, allometry, and vascular anatomy (Bernal et al., <xref ref-type="bibr" rid="B4">2017</xref>). The ability to maintain an elevated temperature in eye, brain, and red muscle has been suggested for the genus <italic>Euthynnus</italic> (Dickson et al., <xref ref-type="bibr" rid="B18">2000</xref>), but reports specific to <italic>E. affinis</italic> are lacking.</p>
<p>Compared to true tunas, <italic>E. affinis</italic> has received scant attention from researchers, and little is known about its biology and physiology. This is likely to change, as <italic>E. affinis</italic> has recently become of interest in marine aquaculture. <italic>E. affinis</italic> is the second tuna species whose full-life cycle culture in captivity has been developed so far, including spawning, egg collection, incubation, larval rearing, and grow-out to marketable size (Yazawa et al., <xref ref-type="bibr" rid="B71">2015</xref>, <xref ref-type="bibr" rid="B72">2016</xref>).</p>
<p>Aquaculture in general is currently facing significant challenges to increasing production while maintaining sustainability (Bridson et al., <xref ref-type="bibr" rid="B5">2020</xref>). Genetic improvement, <italic>via</italic> selective breeding and genetic engineering, is a major focus of research and can yield rapid benefits to efficient production in fish farming (Lu and Luo, <xref ref-type="bibr" rid="B45">2020</xref>). To these ends, a high-quality species genome assembly is critical. Despite recent advances in sequencing technologies and genomics that, in addition to basic fish science (Lien et al., <xref ref-type="bibr" rid="B44">2016</xref>; Hughes et al., <xref ref-type="bibr" rid="B33">2018</xref>; Yuan et al., <xref ref-type="bibr" rid="B75">2018</xref>; Du et al., <xref ref-type="bibr" rid="B20">2020</xref>), have applications to aquaculture practices (Lu and Luo, <xref ref-type="bibr" rid="B45">2020</xref>) and fisheries (Benestan, <xref ref-type="bibr" rid="B3">2020</xref>), genomic information of tuna species is limited. To date, the genomes of only three tuna species are available in the public repositories, none of which are assembled to chromosome level. This situation exists within the entire Pelagiaria clade that, along with tuna, includes the economically important mackerel (Scombrini tribe) and bonito (Sardini tribe).</p>
<p>Here, we report the chromosome-level genome assembly of kawakawa <italic>E. affinis</italic> (NCBI:txid8227). To our knowledge, this is the first available chromosome-level assembly within the Pelagiaria clade. The reported genome assembly is accompanied by transcriptome assembly, genetic linkage map, annotation of transposons, repetitive elements, and 23,059 genes. The dataset provides a solid genome resource not only for further study of <italic>E. affinis</italic> basic biology and genome-scale selective breeding but also for enhancing both basic and applied research within the Pelagiaria clade.</p>
</sec>
<sec sec-type="materials and methods" id="s2">
<title>Materials and Methods</title>
<sec>
<title>Genome Sequencing and Assembly</title>
<p>The tissue sample was obtained from a single wild <italic>E. affinis</italic> female caught off the coast of Ainan, Ehime Prefecture, Japan. High-molecular-weight genomic DNA was isolated from fin using NucleoBond<sup>&#x000AE;</sup> AXG columns with NucleoBond<sup>&#x000AE;</sup> Buffer Set IV (Macherey-Nagel, D&#x000FC;ren, Germany). The quantification of gDNA was performed by Quant-iT&#x02122; dsDNA Broad-Range Assay Kit (<italic>Invitrogen</italic>, Carlsbad, CA, USA), and molecular weight was estimated on 0.75% agarose gel by pulsed-field electrophoresis. The whole-genome sequencing library was prepared using Chromium Genome Library &#x00026; Gel Bead Kit v. 2 (10x Genomics, Pleasanton, CA, USA) as described in the Chromium Genome Reagent Kit v. 2 User Guide. The library was sequenced on Illumina HiSeq X sequencing system using pair-end (2 &#x000D7; 150 bp) sequencing. The sequencing generated 920.3 million (M) reads of total 138.04 Gb with 93.8% and 87.7% of base having quality score Q &#x0003E; 30 in R1 and R2 reads, respectively.</p>
<p>Oxford Nanopore Technology (ONT) sequencing was used to obtain long reads for scaffolding. Libraries were generated using standard protocols from ONT with the SQK-LSK108 ligation sequencing kit (Oxford Nanopore Technologies, Oxford, United Kingdom). GridION X5 sequencing was performed according to the manufacturer&#x00027;s guidelines using three independent FLO-MIN107 (R9.5) flow cells. Base-calling was done by Albacore v. 1.2.4. (Oxford Nanopore Technologies, Oxford, United Kingdom). Raw reads were filtered by quality value QV9 (--minqual 9), and heads and tails were 50 bp trimmed each (--headtrim 50; --tailtrim50) in Yanagiba v. 1.0.0 (Taranto, <xref ref-type="bibr" rid="B63">2017</xref>). The ONT sequencing generated 1.56 M reads with a total of 15.02 Gb, an average length of 9,650 bp, and N50 = 18,747 bp.</p>
<p>Prior to genome assembly, genome characteristics were estimated based on Illumina reads. Jellyfish v. 2.2.6 (Mar&#x000E7;ais and Kingsford, <xref ref-type="bibr" rid="B46">2011</xref>) was applied to generate k-mer counting and frequency distributions of 19-, 21-, and 23-mers. Genome size, heterozygosity, and repeat content were estimated based on the generated k-mer count distributions using GenomeScope (Vurture et al., <xref ref-type="bibr" rid="B66">2017</xref>) with high frequency k-mer cutoff = 10,000. The estimate in GenomeScope is based on an equation that models four evenly spaced negative binomial distributions of the k-mer profile to measure the relative abundances of heterozygous and homozygous, unique, and two-copy sequences (Vurture et al., <xref ref-type="bibr" rid="B66">2017</xref>). The genome size estimate ranged from 745.82 Mb (<italic>k</italic> = 19) to 755.80 Mb (<italic>k</italic> = 23), heterozygosity rate was roughly estimated to be 0.67% (67 SNPs per 10 Kb), and repeat content estimate ranged from 137.00 Mb (<italic>k</italic> = 23) to 170.35 (<italic>k</italic> = 19; <xref ref-type="supplementary-material" rid="SM7">Supplementary Table 1</xref>).</p>
<p>Assembly of Illumina reads was performed in Supernova assembler v. 1.1.5 (10x Genomics, Pleasanton, CA, USA), with default parameters, except maximum reads (--maxreads), set at 386 M input reads to achieve 56 &#x000D7; raw coverage, as suggested in the Supernova protocol. Assembled scaffolds were loaded together with filtered ONT reads into PBJelly v. 15.8.24 (English et al., <xref ref-type="bibr" rid="B22">2012</xref>) where identification of gaps &#x0003E;25 bp, gap filling, and scaffolding were performed using default parameters. In total, 11.31 Mb of gaps (34.8% of initial gap size) were successfully closed. The 787.60-Mb initial draft genome assembly was presented in pseudohaplotype format and consisted of 19,850 scaffold sequences (&#x0003E;1 Kb), of which 21.17 Mb (2.69%) represented unknown bases.</p>
<p>The redundancy of the genome assembly was reduced in three steps: First, 8,191 duplicated scaffolds (24.24 Mb) were removed using dedupe.sh from BBTools v. 38.87 (Bushnell, <xref ref-type="bibr" rid="B6">2014</xref>). Furthermore, scaffolds &#x0003C; 2 Mb were clustered in CD-HIT v. 4.8.1 (Li and Godzik, <xref ref-type="bibr" rid="B43">2006</xref>) with identity threshold &#x02265; 99% (-c 0.99) and word size -n 10. This step removed 1,044 scaffolds (5.1 Mb). Finally, retained scaffolds were self-aligned in LastZ v. 1.04 (Harris, <xref ref-type="bibr" rid="B29">2007</xref>) with alignment identity threshold &#x02265; 99% (--identity = 99) and query coverage threshold &#x02265; 95% (--coverage = 95). If two different scaffolds were self-aligned, the longer one was retained and the shorter one was discarded. In total, 9,250 scaffolds (29.4 Mb; 3.7%) were removed from the initial assembly because of potential duplication or redundancy. The final scaffold-level assembly consisted of 10,600 scaf-folds of 758.20 Mb (19.89 Mb gaps), N50 = 24.78 Mb, and the longest scaffold = 35.13 Mb.</p>
</sec>
<sec>
<title>Linkage Mapping and Chromosome-Level Scaffolding</title>
<p>We obtained two types of linkage evidence: diploid, based on full-sib family linkage analyses, and haploid, based on linkage analyses of interspecific hybrids (Yoshitake et al., <xref ref-type="bibr" rid="B73">2018</xref>) of <italic>E. affinis</italic> female and <italic>T. orientalis</italic> male. Based on a genome coordinate of each marker in the linkage maps, we anchored and oriented scaffolds into pseudochromosomes.</p>
<p>To construct a diploid linkage map, DNA was extracted from fin clips of parents and 94 of their progeny using NucleoSpin<sup>&#x000AE;</sup> Tissue (Macherey-Nagel, D&#x000FC;ren, Germany). All specimens were assessed for body weight, standard length, head length, and body depth (<xref ref-type="supplementary-material" rid="SM8">Supplementary Table 2</xref>). Genotyping by random amplicon sequencing-direct (GRAS-Di<sup>&#x000AE;</sup>) libraries of each specimen were prepared according to the protocol of Hosoya et al. (<xref ref-type="bibr" rid="B32">2019</xref>). The final PCR products were pooled, purified using the MiniElute PCR Purification Kit (Qiagen, Hilden, Germany), and applied for pair-end (2 &#x000D7; 76 bp) sequencing on the Illumina NextSeq 500. Library preparation and sequencing were done by Bioengineering Lab. Co., Ltd., under a license agreement, as GRAS-Di<sup>&#x000AE;</sup> is patented by the Toyota Motor Corporation (Aichi, Japan) (patent ID P2018-42548A). The sequencing generated &#x0007E;160 M (12.17 Gb) raw reads. These were trimmed in TrimGalore v. 0.6.4 (Krueger, <xref ref-type="bibr" rid="B39">2019</xref>) to remove residues of indexes, nucleotides with quality &#x02264; Q20, and reads &#x02264; 20 bp after trimming. In total, 64.81 M reads in pairs (675,154 reads per sample on average) with a total length of 9.67 Gb (100.72 Mb per sample on average) were retained after trimming (<xref ref-type="supplementary-material" rid="SM8">Supplementary Table 2</xref>). Trimmed reads of each sample were mapped onto reference assembly using Bowtie2 v. 2.4 (Langmead and Salzberg, <xref ref-type="bibr" rid="B41">2012</xref>) allowing no mismatches in the read seed (-N 0). The overall mapping rate was 92.2% with 74.9% of reads mapped only once (<xref ref-type="supplementary-material" rid="SM8">Supplementary Table 2</xref>). Sorted BAM files were created using samtools v. 1.10 (Danecek et al., <xref ref-type="bibr" rid="B16">2021</xref>). Variants were called in bcftools v. 1.10.2 (Danecek et al., <xref ref-type="bibr" rid="B16">2021</xref>) by <italic>mpileup</italic> and <italic>call</italic> commands using multiallelic-caller and variants-only flags (-mv). Filtering of SNPs was performed in vcftools v. 0.1.16 (Danecek et al., <xref ref-type="bibr" rid="B15">2011</xref>) removing indels (--remove-indels), SNPs with quality &#x02264; 30 (--minQ 30), SNPs not in HWE (--hwe 0.05), and genotypes with depth &#x02264; 10 (--minDP 10). Minor allele frequency was set to 0.05 (--maf 0.05), retaining 5,853 SNPs of 368,265 raw variants. Genotypes were phased, and both female and male linkage maps were constructed in TMap v. 1.1 (Cartwright et al., <xref ref-type="bibr" rid="B10">2007</xref>). All segregating markers that showed polymorphism in at least one parent were used. The ratio of marker segregation was calculated by chi-squared test. Markers showing significantly distorted segregation (<italic>p</italic>-value &#x0003C; 0.001) were excluded from the map construction. A minimum logarithm of odds (LOD) threshold of 5.0 was selected to assign markers to 24 linkage groups. Recombination rates were calculated by the multipoint-likelihood maximization, and map distances were converted by Kosambi mapping function. A total of 852 of 1,332 polymorphic loci were assigned to 24 linkage groups covering a total length of 1,554.7 cM of the <italic>E. affinis</italic> genome (<xref ref-type="supplementary-material" rid="SM3">Supplementary File 1</xref>).</p>
<p>To obtain haploid linkage evidence, interspecific hybrids of <italic>E. affinis</italic> and <italic>T. orientalis</italic> were produced. Briefly, eggs of a single <italic>E. affinis</italic> female were mixed with cryopreserved sperm of <italic>T. orientalis</italic> provided by the Aquaculture Research Institute, Kindai University, Japan. Seawater was immediately added to activate gametes and induce fertilization. After 1&#x02013;2 h, eggs with proceeding cleavage were selected and transferred to the hatching tank at 24&#x000B0;C. After 36&#x02013;40 h, 202 individuals that hatched or died after reaching somite formation were separately transferred to a 1.5-ml tube and stored in 100% ethanol. DNA was extracted from parents and F1 hybrids using a NucleoSpin Tissue XS kit (Macherey-Nagel, D&#x000FC;ren, Germany). A sequencing library was prepared from 135 specimens, which provided sufficient DNA for use of the Nextera DNA Library Preparation Kit and Nextera Index Kit (Illumina) following the manufacturer&#x00027;s protocols. The library was sequenced on two lines of Illumina HiSeq X sequencing system. The sequencing resulted in 2,274 M sequencing reads with a total of 342 Gb. Reads were mapped onto a reference obtained by combining <italic>E. affinis</italic> scaffold-level assembly and <italic>T. orientalis</italic> genome (Suda et al., <xref ref-type="bibr" rid="B61">2019</xref>) using BWA mem v. 0.7.15 (Li and Durbin, <xref ref-type="bibr" rid="B42">2009</xref>). Mapped reads were sorted in samtools v. 1.10 (Danecek et al., <xref ref-type="bibr" rid="B16">2021</xref>), and variants were called in bcftools v. 1.10.2 (Danecek et al., <xref ref-type="bibr" rid="B16">2021</xref>) by <italic>mpileup</italic> and <italic>call</italic> commands. Linkage evidence of scaffolds was obtained through linkage analysis of hybrids in SELDLA v. 2.0.9 (Yoshitake et al., <xref ref-type="bibr" rid="B73">2018</xref>) using 13,403,357 SNPs specific to <italic>E. affinis</italic>.</p>
<p>Female and male linkage maps and scaffold linkage evidence were transformed to BED files and merged. Pseudochromosomes were then reconstructed using ALLMAPS v. 1.1.7 from the JCVI utility libraries v. 0.7.5 (Tang et al., <xref ref-type="bibr" rid="B62">2015</xref>) with inter-scaffold gaps set to a fixed size of 100 Ns. The package was used to merge bad files and to anchor, order, and orient genomic scaffolds using default parameters. Overall, 387 scaffolds with total length of 685.79 Mb (90.7% of scaffold-level assembly) were anchored onto 24 pseudochromosomes leaving 10,213 scaffolds of total length 72.42 Mb unplaced. Only two unplaced scaffolds had length &#x0003E; 1 Mb (<xref ref-type="supplementary-material" rid="SM1">Supplementary Figure 1</xref>). The final assembly contained 10,237 scaffolds of 758.24 Mb (19.96 Mb gaps), N50 = 29.18 Mb, and longest scaffold = 35.73 Mb (<xref ref-type="table" rid="T1">Table 1</xref>).</p>
<table-wrap position="float" id="T1">
<label>Table 1</label>
<caption><p>Descriptive statistics of kawakawa <italic>Euthynnus affinis</italic> genome assembly, transcriptome assembly, repetitive DNA annotation, gene prediction, and functional annotation with completeness assessment results.</p></caption>
<table frame="hsides" rules="groups">
<tbody>
<tr>
<td valign="top" align="left" colspan="2"><bold>Genome assembly</bold></td>
</tr>
<tr>
<td valign="top" align="left">Number of sequences</td>
<td valign="top" align="center">10,237</td>
</tr>
<tr>
<td valign="top" align="left">Total length (bp)</td>
<td valign="top" align="center">758,243,246</td>
</tr>
<tr>
<td valign="top" align="left">N50 (bp)</td>
<td valign="top" align="center">29,176,746</td>
</tr>
<tr>
<td valign="top" align="left">Max scaffold length (bp)</td>
<td valign="top" align="center">35,734,308</td>
</tr>
<tr>
<td valign="top" align="left">GC content (%)</td>
<td valign="top" align="center">39.78</td>
</tr>
<tr>
<td valign="top" align="left">Gaps (bp)</td>
<td valign="top" align="center">19,960,513</td>
</tr>
<tr>
<td valign="top" align="left">BUSCO (%)</td>
<td valign="top" align="center">C = 97.1; S = 96.1; D = 1.0; F = 1.0; M = 1.9</td>
</tr>
<tr>
<td valign="top" align="left" colspan="2"><bold>Transcriptome assembly</bold></td>
</tr>
<tr>
<td valign="top" align="left">Number of sequences</td>
<td valign="top" align="center">49,510</td>
</tr>
<tr>
<td valign="top" align="left">Total length (bp)</td>
<td valign="top" align="center">94,582,375</td>
</tr>
<tr>
<td valign="top" align="left">N50 (bp)</td>
<td valign="top" align="center">3,622</td>
</tr>
<tr>
<td valign="top" align="left">Max contig length (bp)</td>
<td valign="top" align="center">56,879</td>
</tr>
<tr>
<td valign="top" align="left">BUSCO (%)</td>
<td valign="top" align="center">C = 91.7; S = 90.3; D = 1.4; F = 1.3; M = 7.0</td>
</tr>
<tr>
<td valign="top" align="left" colspan="2"><bold>Repeat annotation</bold></td>
</tr>
<tr>
<td valign="top" align="left">SINEs (bp)</td>
<td valign="top" align="center">1,061,850 (0.14%)</td>
</tr>
<tr>
<td valign="top" align="left">LINEs (bp)</td>
<td valign="top" align="center">22,627,927 (2.98%)</td>
</tr>
<tr>
<td valign="top" align="left">LTR elements (bp)</td>
<td valign="top" align="center">6,260,411 (0.83%)</td>
</tr>
<tr>
<td valign="top" align="left">DNA transposons (bp)</td>
<td valign="top" align="center">44,033,659 (5.81%)</td>
</tr>
<tr>
<td valign="top" align="left">Small RNA (bp)</td>
<td valign="top" align="center">570,727 (0.08%)</td>
</tr>
<tr>
<td valign="top" align="left">Satellites (bp)</td>
<td valign="top" align="center">101,725 (0.01%)</td>
</tr>
<tr>
<td valign="top" align="left">Simple repeats (bp)</td>
<td valign="top" align="center">19,817,678 (2.61%)</td>
</tr>
<tr>
<td valign="top" align="left">Low complexity (bp)</td>
<td valign="top" align="center">3,166,036 (0.42%)</td>
</tr>
<tr>
<td valign="top" align="left">Unclassified (bp)</td>
<td valign="top" align="center">94,139,074 (12.42%)</td>
</tr>
<tr>
<td valign="top" align="left">Total (bp)</td>
<td valign="top" align="center">194,013,215 (25.59%)</td>
</tr>
<tr>
<td valign="top" align="left" colspan="2"><bold>Gene annotation</bold></td>
</tr>
<tr>
<td valign="top" align="left">Number of predicted genes</td>
<td valign="top" align="center">23,059</td>
</tr>
<tr>
<td valign="top" align="left">Mean length (bp)</td>
<td/>
</tr>
<tr>
<td valign="top" align="left">&#x000A0;&#x000A0;Gene</td>
<td valign="top" align="center">10,511</td>
</tr>
<tr>
<td valign="top" align="left">&#x000A0;&#x000A0;Exon</td>
<td valign="top" align="center">244</td>
</tr>
<tr>
<td valign="top" align="left">&#x000A0;&#x000A0;Intron</td>
<td valign="top" align="center">939</td>
</tr>
<tr>
<td valign="top" align="left">&#x000A0;&#x000A0;CDS</td>
<td valign="top" align="center">1,592</td>
</tr>
<tr>
<td valign="top" align="left">Mean exon per gene</td>
<td valign="top" align="center">10</td>
</tr>
<tr>
<td valign="top" align="left">% of genome covered by genes</td>
<td valign="top" align="center">32.0</td>
</tr>
<tr>
<td valign="top" align="left">% of genome covered by CDS</td>
<td valign="top" align="center">4.8</td>
</tr>
<tr>
<td valign="top" align="left">BUSCO</td>
<td valign="top" align="center">C = 89.1; S = 87.8; D = 1.3; F = 3.4; M = 7.5</td>
</tr>
<tr>
<td valign="top" align="left">Functionally annotated total</td>
<td valign="top" align="center">21,313 (92.4%)</td>
</tr>
<tr>
<td valign="top" align="left">&#x000A0;&#x000A0;Swissport</td>
<td valign="top" align="center">19,750 (85.6%)</td>
</tr>
<tr>
<td valign="top" align="left">&#x000A0;&#x000A0;trEMBL</td>
<td valign="top" align="center">21,310 (92.4%)</td>
</tr>
<tr>
<td valign="top" align="left">&#x000A0;&#x000A0;NCBI NR</td>
<td valign="top" align="center">21,077 (91.4%)</td>
</tr>
<tr>
<td valign="top" align="left">&#x000A0;&#x000A0;InterPro</td>
<td valign="top" align="center">17,718 (76.8%)</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p><italic>BUSCO = benchmarking universal single copy orthologs; C = complete; S = complete and single copy; D = complete and duplicated; F = fragmented; M = missing; LINEs = long interspersed nuclear elements; LTR = long terminal repeat; SINEs = short interspersed nuclear elements</italic>.</p>
</table-wrap-foot>
</table-wrap>
</sec>
<sec>
<title>mRNA Sequencing and Transcriptome Assembly</title>
<p>Total RNA was extracted from eight tissues (brain, liver, kidney, ovary, testis, spleen, gill, muscle, and intestine) using TRIzol (<italic>Invitrogen</italic>, Carlsbad, CA, USA) and the NucleoSpin<sup>&#x000AE;</sup> RNA Plus extraction kit (Macherey-Nagel, D&#x000FC;ren, Germany) following the manufacturer&#x00027;s protocols for each tissue. RNA extracts were quantified using a NanoPhotometer N50 (Implen, M&#x000FC;nchen, Germany) and subsequently combined in equimolar quantities into a single pool for sequencing. RNA sequencing library was prepared by MGIEasy RNA Directional Library Prep Set (MGI Tech Co Ltd.). Pair-end (2 &#x000D7; 150 bp) sequencing was performed on a DNBSEQ-G400 sequencer (MGI Tech Co Ltd.). All procedures were conducted according to the manufacturer&#x00027;s protocols. The sequencing generated &#x0007E;682 M (102.53 Gb) raw reads. Quality metrics for sequencing reads were initially examined in FastQC v. 0.11.9. (Andrews, <xref ref-type="bibr" rid="B1">2020</xref>). Rare, possibly erroneous, k-mers were removed in Rcorrector v. 1.0.4 (Song and Florea, <xref ref-type="bibr" rid="B58">2015</xref>) with default parameters, and adapters and low-quality bases were trimmed in TrimGalore v. 0.6.4 (Krueger, <xref ref-type="bibr" rid="B39">2019</xref>) with parameters --length 36 -q 5 --stringency 3 -e 0.1 retaining &#x0007E;614 M (92.18 Gb) pair-end reads. The FastQC results revealed deviation from normal distribution of GC content, and a high number of overrepresented sequences, possibly due to incomplete polyA capture during library preparation. Thus, trimmed reads were mapped against ribosomal RNA (rRNA) sequence database SILVA release 128 (Quast et al., <xref ref-type="bibr" rid="B51">2012</xref>) using Bowtie2 v. 2.4 (Langmead and Salzberg, <xref ref-type="bibr" rid="B41">2012</xref>) with parameters --nofw --quiet -D 20 -R 3 -N 0 -L 20 -i S,1,0.50 to remove rRNA contaminants. The 359.6 M (53.9 Gb) reads that did not map (--un-conc-gz) to the SILVA database were processed for <italic>de novo</italic> assembly in Trinity v. 2.11.0 (Grabherr et al., <xref ref-type="bibr" rid="B25">2011</xref>) with default k-mer size 25 and --SS_lib_type RF --min_contig_length 300 flags. Initial transcriptome assembly resulted in 271,656 contigs of 242.43 Mb, N50 = 1.20 Kb. These were transferred to super transcripts (Davidson et al., <xref ref-type="bibr" rid="B17">2017</xref>) by Trinity&#x00027;s v. 2.11.0 Trinity_gene_splice_modeler.py, and further redundancy was reduced by Bellerophon pipeline v. 1.0 (Kerkvliet et al., <xref ref-type="bibr" rid="B37">2019</xref>), removing minimally expressed (transcripts per million cut off = 1) and highly identical (95%) contigs (CDHIT-EST -c 0.95). Final transcriptome assembly consisted of 49,510 contigs of 94.58 Mb, N50 = 3.62 Kb, with the longest contig = 56.88 Kb (<xref ref-type="table" rid="T1">Table 1</xref>).</p>
</sec>
<sec>
<title>Repeat and Gene Annotation</title>
<p>A <italic>de novo</italic> repeat library was generated using RepeatModeler v. 2.0.1 (Flynn et al., <xref ref-type="bibr" rid="B23">2020</xref>) and MITE Tracker v. 1.0.0 (Crescente et al., <xref ref-type="bibr" rid="B14">2018</xref>) with default parameters. The genome was then screened for repeats and low complexity regions by RepeatMasker v. 4.1.1 (Smit et al., <xref ref-type="bibr" rid="B57">2015</xref>) in two runs using (i) <italic>de novo</italic>-generated repeat library and (ii) a Dfam database of interspersed repeats, release 3.3 (Storer et al., <xref ref-type="bibr" rid="B60">2021</xref>). Results of the runs were analyzed together to generate final non-redundant repeat annotation. Repetitive regions accounted for 25.59% (194.01 Mb) of genome assembly (<xref ref-type="fig" rid="F1">Figure 1A</xref>; <xref ref-type="table" rid="T1">Table 1</xref>). These included 12.42% unclassified repeats, 3.95% retrotransposons, 5.81% DNA transposons, 0.08% small RNAs, 0.01% satellites, 2.61% simple repeats, and 0.42% low complexity regions (<xref ref-type="supplementary-material" rid="SM4">Supplementary File 2</xref>).</p>
<fig id="F1" position="float">
<label>Figure 1</label>
<caption><p>Characterization of the draft genome assembly of kawakawa <italic>Euthynnus affinis</italic>. <bold>(A)</bold> Summary of the genome annotation of kawakawa <italic>Euthynnus affinis</italic>. The tracks from inside to outside: GC content (%), negative-strand gene abundance (blue), positive-strand gene abundance (red), negative strand repetitive DNA abundance (green), positive-strand repetitive DNA abundance (orange), 24 pseudochromosomes (colors within each pseudochromosome denote different scaffolds). Window size = 1 Mb. <bold>(B)</bold> Chromosome level synteny between kawakawa <italic>Euthynnus affinis</italic> (right) and Japanese rice fish <italic>Oryzias latipes</italic> (left) based on 2,989 single-copy orthologs. <bold>(C)</bold> Number of orthogroups shared between each species pair of eight fish. <bold>(D)</bold> UpSet plot of intersections between orthogroups in different species. The bars show the number of common orthogroups for a given species or a group of species (dots connected by lines below the <italic>x</italic>-axis). In total, 10,586 orthogroups are common to all species, while 1,129 orthogroups are unique to <italic>E. affinis</italic> and <italic>T. orientalis</italic> (blue). <italic>Euthynnus affinis&#x02013;</italic>specific orthogroups (109) are shown in yellow. The species lacks 892 orthogroups found in all other species (red). Intersections with fewer than 100 orthogroups are not shown. <bold>(E)</bold> Orthogroup size and proportion of genes assigned to orthogroups per species. Yellow = number of genes; blue = number of genes in orthogroups; orange = number of orthogroups containing a given species; gray = number of unassigned genes.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fgene-12-739781-g0001.tif"/>
</fig>
<p>Gene models were predicted in MAKER v. 3.01.03 (Holt and Yandell, <xref ref-type="bibr" rid="B31">2011</xref>) in three successive runs. Prior to the first run, complex repeats were retrieved from the repeat annotation file and submitted to MAKER as pre-identified repeat elements (rm_gff) while still enabling the software to identify and soft mask simple repeats internally (Card, <xref ref-type="bibr" rid="B9">2017</xref>). In this approach, complex repeats are hard masked so that they do not confound the ability to identify coding genes, while simple repeats remain available for inclusion in gene annotations, as many protein-coding genes contain runs of low-complexity sequence (Toll-Riera et al., <xref ref-type="bibr" rid="B65">2011</xref>). During the first run, the <italic>E. affinis</italic> transcripts were aligned to the genome by BLASTN (Camacho et al., <xref ref-type="bibr" rid="B7">2009</xref>) and protein sequences of <italic>Danio rerio, Gasterosteus aculeatus, Hippocampus comes, Oreochromis niloticus, Oryzias latipes, Seriola dumerili, Sparus aurata</italic>, and <italic>Takifugu rubripes</italic> from the Ensembl database v. 103 (Yates et al., <xref ref-type="bibr" rid="B70">2019</xref>) along with <italic>Thunnus orientalis</italic> (Yasuike et al., <xref ref-type="bibr" rid="B69">2016</xref>) by BLASTX (Camacho et al., <xref ref-type="bibr" rid="B7">2009</xref>). Subsequently, BLAST hits were polished by Exonerate v. 2.4.7. (Slater and Birney, <xref ref-type="bibr" rid="B56">2005</xref>) est2genome and protein2genome. All filtering statistics for BLAST and Exonerate were as the default by MAKER. The second and third runs of MAKER utilized gene models from the first, followed by the second, runs to train <italic>ab initio</italic> gene prediction tools SNAP v. 2013-02-16 (Korf, <xref ref-type="bibr" rid="B38">2004</xref>) and Augustus v. 3.3.3. (Stanke and Waack, <xref ref-type="bibr" rid="B59">2003</xref>). This bootstrap process allows to iteratively improve the performance of <italic>ab initio</italic> gene predictors as they require existing gene models on which to base prediction parameters. SNAP was retrained using gene models with an annotation edit distance (Holt and Yandell, <xref ref-type="bibr" rid="B31">2011</xref>) (AED) &#x02264; 0.25 and amino acid length of &#x02265; 50. BUSCO v. 5.1.2 (Simao et al., <xref ref-type="bibr" rid="B55">2015</xref>) with --long argument and actinopterygii_obd10 lineage dataset was used to retrain Augustus using genomic regions of RNA annotations from the previous run including an additional 1,000 bp on each side as input file. Both SNAP and Augustus were run with default parameters specified in MAKER. Only gene models with AED &#x0003C;0.5 were retained in the final annotation set.</p>
<p>For functional annotation of predicted genes, predicted protein sequences were mapped against UniProtKB/Swiss-Prot (The UniProt Consortium, <xref ref-type="bibr" rid="B64">2021</xref>) and NCBI non-redundant (O&#x00027;Leary et al., <xref ref-type="bibr" rid="B50">2016</xref>) protein databases using BLASTP (Camacho et al., <xref ref-type="bibr" rid="B7">2009</xref>) with an e-value threshold of 1e&#x02212;6. Additionally, protein motifs, domains, and signatures were annotated using Interproscan v. 5.48 (Jones et al., <xref ref-type="bibr" rid="B34">2014</xref>), and Gene Ontology (GO) terms were obtained from the corresponding InterPro entry. Kyoto Encyclopedia of Genes and Genomes Orthologs (KOs) were assigned to predicted proteins using KofamKOALA (Aramaki et al., <xref ref-type="bibr" rid="B2">2019</xref>) with an e-value threshold of 1e&#x02212;3.</p>
<p>In total, 23,059 putative genes spanning 32.0% of the genome were predicted (<xref ref-type="fig" rid="F1">Figure 1A</xref>; <xref ref-type="table" rid="T1">Table 1</xref>). We found 21,313 (92.4%) predicted genes to match at least one of the databases (<xref ref-type="table" rid="T1">Table 1</xref>), and at least one GO and/or KO term was retrieved for 11,429 and 14,796 predicted genes, respectively.</p>
</sec>
</sec>
<sec id="s3">
<title>Data Validation</title>
<p>To validate the structural accuracy of the genome assembly and transcriptome assembly, Illumina and DNBSEQ pair-end sequencing reads were mapped back to the draft genome and transcriptome, respectively, using Bowtie2 v. 2.4 (Langmead and Salzberg, <xref ref-type="bibr" rid="B41">2012</xref>) with default parameters. A total of 98.59% of the Illumina reads mapped to the genome with 97.4% of bases being covered &#x0003E;5 times. Mapping rate of clean DNBSEQ reads mapped to the transcriptome was 91.14% with 93.77% of bases being covered &#x0003E;5 times.</p>
<p>Completeness of both assemblies was accessed by two approaches. First, a total of 227 (97.42%) and 230 (98.71%) core vertebrate genes (CVGs) from the complete set of 233 CVGs (Hara et al., <xref ref-type="bibr" rid="B28">2015</xref>) were identified in the genome and the transcriptome, respectively, by gVolante (Nishimura et al., <xref ref-type="bibr" rid="B49">2017</xref>). Then, BUSCO v. 5.1.2 (Simao et al., <xref ref-type="bibr" rid="B55">2015</xref>) was used to assess the presence of 3,640 actinopterygian single-copy orthologs (actinopterygii_odb10 lineage dataset) in both assemblies. In the genome, 3,534 (97.1%) single-copy orthologs were identified, of which 3,498 (96.1%) were complete and single copy. In the transcriptome, 3,338 (91.7%) single-copy orthologs were identified, of which 3,288 (90.3%) were complete and single copy (<xref ref-type="table" rid="T1">Table 1</xref>).</p>
<p>To verify the accuracy of the scaffold arrangement in 24 pseudochromosomes, the genomic locations of single-copy orthologs in <italic>E. affinis</italic> and <italic>O. latipes</italic> were compared and visualized in shinyCircos v. 1.0 (Yu et al., <xref ref-type="bibr" rid="B74">2018</xref>). Only unduplicated orthologs co-identified in both species by BUSCO v. 5.1.2 (Simao et al., <xref ref-type="bibr" rid="B55">2015</xref>) were used for comparison.</p>
<p>In summary, 2,561 of 2,989 single-copy orthologs were localized on the same chromosomes in both species (<xref ref-type="fig" rid="F1">Figure 1B</xref>), revealing the high consistency of their genomes. Based on this result, the first 24 scaffolds of <italic>E. affinis</italic> genome assembly were numbered in concordance with <italic>O. latipes</italic> chromosomes.</p>
<p>The predicted gene set was assessed for completeness by the method used for genome and transcriptome assembly. The predicted gene set contained 215 (92.3%) of 233 CVGs (Hara et al., <xref ref-type="bibr" rid="B28">2015</xref>) and 3,245 (89.1%) of 3,640 actinopterygian single-copy orthologs (<xref ref-type="table" rid="T1">Table 1</xref>). The predicted genes were clustered with those of seven fish species <italic>A. testudineus, D. rerio, G. aculeatus, H. comes, O. latipes, S. lalandi</italic>, and <italic>T. orientalis</italic> in OrthoFinder2 v. 2.3.8 (Emms and Kelly, <xref ref-type="bibr" rid="B21">2015</xref>) to identify orthologous groups, i.e., a set of genes descended from a single gene in the last common ancestor (Emms and Kelly, <xref ref-type="bibr" rid="B21">2015</xref>). The results were visualized in TBtools (Chen et al., <xref ref-type="bibr" rid="B11">2020</xref>) and ggplot2 (Wickham, <xref ref-type="bibr" rid="B67">2016</xref>).</p>
<p>In total, 181,780 of 192,254 genes from eight species were clustered into 21,003 orthogroups with 10,586 orthogroups being shared by all species (<xref ref-type="fig" rid="F1">Figure 1D</xref>). Of 23,059 predicted genes of <italic>E. affinis</italic>, 20,749 were assigned to 16,595 orthogroups (<xref ref-type="fig" rid="F1">Figures 1C,E</xref>) with 109 (311 genes) being unique to <italic>E. affinis</italic>. Species of the Thunnini tribe, <italic>E. affinis</italic> and <italic>T. orientalis</italic>, possessed 1,129 unique orthogroups (<xref ref-type="fig" rid="F1">Figure 1D</xref>). In contrast, 892 orthogroups not detected in <italic>E. affinis</italic> were identified in all other species. This suggests that, although the genes belonging to these orthogroups were not captured during gene annotation, they are likely present in the <italic>E. affinis</italic> genome.</p>
<p>The present dataset was confirmed to be (i) accurate; (ii) sufficiently complete by current standards; (iii) consistent with genomic recourse of other closely related species; and (iv) reliably reusable for cooperative applications within the Thunnini tribe as well as within the entire Pelagiaria clade.</p>
</sec>
<sec id="s4">
<title>Phylogenetic Analyses</title>
<p>Single-copy orthologs were identified in the <italic>de novo</italic> assembled <italic>E. affinis</italic> genome and across genomes of <italic>Danio rerio</italic> (GCF_000002035.6) and 15 representative species of the Percomorpha clade: <italic>Anabas testudineus</italic> (GCF_900324465.2), <italic>Brotula barbata</italic> (GCA_900303265.1), <italic>G. aculeatus</italic> (GCA_000180675.1), <italic>Macroramphosus scolopax</italic> (GCA_901007825.1), <italic>O. niloticus</italic> (GCF_001858045.2), <italic>O. latipes</italic> (GCA_002234675.1), <italic>Paralichthys olivaceus</italic> (GCA_001904815.2), <italic>Periophthalmus magnuspinnatus</italic> (GCF_009829125.1), <italic>S. lalandi</italic> (GCA_003054885.1), <italic>S. aurata</italic> (GCF_900880675.1), <italic>Syngnathus acus</italic> (GCF_901709675.1), <italic>Thalassophryne amazonica</italic> (GCA_902500255.1), <italic>T. albacares</italic> (GCA_900302625.1), <italic>T. orientalis</italic> (GCA_009176245.1), and <italic>T. thynnus</italic> (GCA_003231725.1) by BUSCO v. 3.0.2 (Simao et al., <xref ref-type="bibr" rid="B55">2015</xref>). A total of 1,178 complete unduplicated BUSCO genes identified across genomes of all the above species were separately aligned in MAFFT v. 7.475 (Katoh and Standley, <xref ref-type="bibr" rid="B36">2013</xref>) using the BLOSUM62 matrix of substitutions (--bl 62). Each alignment was trimmed in trimAl v. 1.4.1 (Capella-Guti&#x000E9;rrez et al., <xref ref-type="bibr" rid="B8">2009</xref>) to remove sites of unclear homology using the heuristic method <italic>automated1</italic>. The resulting alignments were concatenated by catsequences v. 1.3. (Creevey, <xref ref-type="bibr" rid="B13">2021</xref>) (<xref ref-type="supplementary-material" rid="SM5">Supplementary File 3</xref>), and the species tree was inferred in IQ-TREE v. 2.0.3 (Nguyen et al., <xref ref-type="bibr" rid="B48">2015</xref>) letting ModelFinder (Kalyaanamoorthy et al., <xref ref-type="bibr" rid="B35">2017</xref>) select the optimal substitution model for each partition prior to running the tree interface with 1,000 ultrafast bootstrap replicates (Hoang et al., <xref ref-type="bibr" rid="B30">2018</xref>) and 1,000 replicates for the Shimodaira-Hasegawa-like approximate likelihood ratio test (SH-aLRT) (Guindon et al., <xref ref-type="bibr" rid="B27">2010</xref>). The divergence time was estimated with MCMCTree in the package PAML 4.9j (Yang, <xref ref-type="bibr" rid="B68">1997</xref>) using parameters with independent clock rates. Calibration divergence times of <italic>A. testudineus</italic> from <italic>S. lalandi</italic> (91&#x02013;102 million years ago [Mya]), <italic>T. orientalis</italic> from <italic>O. latipes</italic> (106&#x02013;144 Mya), and <italic>D. rerio</italic> from Percomorpha (206&#x02013;252 Mya) obtained from TimeTree database (Kumar et al., <xref ref-type="bibr" rid="B40">2017</xref>) were used as time scales to estimate the divergence time of <italic>E. affinis</italic> from other percomorph species. The final tree was drawn in FigTree v. 1.4.4 (Rambaut, <xref ref-type="bibr" rid="B52">2018</xref>).</p>
<p>Observed phylogenetic relationships were consistent with recent studies of phylogeny of the Percomorpha clade (Sanciangco et al., <xref ref-type="bibr" rid="B54">2016</xref>; Friedman et al., <xref ref-type="bibr" rid="B24">2019</xref>). The divergence time of <italic>E. affinis</italic> from a common tuna ancestor was inferred to be &#x0007E;46.9 Mya (<xref ref-type="supplementary-material" rid="SM6">Supplementary File 4</xref>; <xref ref-type="supplementary-material" rid="SM2">Supplementary Figure 2</xref>). This is more than twice the age estimated in the TimeTree database (Kumar et al., <xref ref-type="bibr" rid="B40">2017</xref>) but in agreement with the most recent study by Friedman et al. (<xref ref-type="bibr" rid="B24">2019</xref>).</p>
</sec>
<sec sec-type="data-availability" id="s5">
<title>Data Availability Statement</title>
<p>The datasets presented in this study can be found in online repositories. The names of the repository/repositories and accession number(s) can be found below: <ext-link ext-link-type="uri" xlink:href="https://www.ddbj.nig.ac.jp/">https://www.ddbj.nig.ac.jp/</ext-link>, <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="BPLY01000001">BPLY01000001</ext-link> - <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="BPLY01010237">BPLY01010237</ext-link>, <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="ICRR01000001">ICRR01000001</ext-link> - <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="ICRR01049510">ICRR01049510</ext-link>, <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="DRA012118">DRA012118</ext-link>, <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="DRA012140">DRA012140</ext-link>, <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="DRA012141">DRA012141</ext-link>, <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/">https://www.ncbi.nlm.nih.gov/</ext-link>, <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="PRJNA725361"></ext-link>, <ext-link ext-link-type="uri" xlink:href="https://figshare.com/">https://figshare.com/</ext-link>, doi: <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.6084/m9.figshare.14937774">10.6084/m9.figshare.14937774</ext-link>.</p>
</sec>
<sec id="s6">
<title>Ethics Statement</title>
<p>The animal study was reviewed and approved by Animal Care Committee of Ehime University.</p>
</sec>
<sec id="s7">
<title>Author Contributions</title>
<p>MH and ES: conceptualization, writing&#x02014;review and editing. MH, ES, TS, and KY: data curation. MH, ES, KY, and DS: formal analysis, investigation. MT, SA, and TM: funding acquisition. RG, MT, TM: project administration. TS, RG, TM, SA, and TI: resources. MH, ES, and KY: validation. MH and TS: visualization. MH and KY: writing original draft. MH: performed the majority of data analysis. DS, KY, TI, and SA contributed solely to tasks related to the production of interspecific hybrids and their subsequent analyses. All authors read and approved the final version of the manuscript.</p>
</sec>
<sec sec-type="funding-information" id="s8">
<title>Funding</title>
<p>The study was financially supported by the Ministry of Education, Culture, Sports, Science and Technology of Japan (MEXT) under the Regional Innovation and Ecosystem Formation Program (FY2017-2021); Bio-oriented Technology Research Advancement, Naro (BRAIN) under the special scheme project on regional developing strategy (16818524); and the National University Corporation Ehime University Research Fellow Employment Support Expenses (2021) under the special scheme project on regional developing strategy (ZK39b).</p>
</sec>
<sec sec-type="COI-statement" id="conf1">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s9">
<title>Publisher&#x00027;s Note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec> 
</body>
<back>
<sec sec-type="supplementary-material" id="s10">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fgene.2021.739781/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fgene.2021.739781/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Image_1.TIF" id="SM1" mimetype="image/tif" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary Figure 1</label>
<caption><p>Length distribution of kawakawa <italic>Euthynnus affinis</italic> genome assembly.</p></caption></supplementary-material>
<supplementary-material xlink:href="Image_2.TIF" id="SM2" mimetype="image/tif" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary Figure 2</label>
<caption><p>Time-calibrated phylogeny of representative species of the nine major percomorph clades with zebrafish <italic>Danio rerio</italic> as outgroup.</p></caption></supplementary-material>
<supplementary-material xlink:href="Data_Sheet_1.ZIP" id="SM3" mimetype="application/zip" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary File 1</label>
<caption><p>Genetic linkage information of each marker with its location in both scaffold level assembly and pseudochromosome level assembly.</p></caption></supplementary-material>
<supplementary-material xlink:href="Data_Sheet_2.CSV" id="SM4" mimetype="text/csv" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary File 2</label>
<caption><p>Major categories and quantities of repeat elements in <italic>E. affinis</italic> genome assembly.</p></caption></supplementary-material>
<supplementary-material xlink:href="Data_Sheet_3.PDF" id="SM5" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary File 3</label>
<caption><p>Nucleotide alignment of 1,179 single copy orthologs of <italic>Euthynnus affinis, Danio rerio</italic> and 15 representative species of Percomorpha clade.</p></caption></supplementary-material>
<supplementary-material xlink:href="Data_Sheet_4.ZIP" id="SM6" mimetype="application/zip" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary File 4</label>
<caption><p>Phylogenetic tree and partition information giving position of each gene in the alignment and substitution model for each gene.</p></caption></supplementary-material>
<supplementary-material xlink:href="Table_1.DOCX" id="SM7" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary Table 1</label>
<caption><p>Results of genome characteristics estimate for three k-mers (19, 21, and 23).</p></caption></supplementary-material>
<supplementary-material xlink:href="Table_2.XLSX" id="SM8" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary Table 2</label>
<caption><p>Detailed data for all specimens used for genotyping by sequencing and linkage mapping. These include phenotype data, the number of sequencing reads and length of the data before and after trimming, and results of mapping of trimmed reads of each specimen to <italic>E. affinis</italic> genome assembly.</p></caption></supplementary-material>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="web"><person-group person-group-type="author"><name><surname>Andrews</surname> <given-names>S.</given-names></name></person-group> (<year>2020</year>). <source>FastQC Version 0.11.9</source>. Available online at: <ext-link ext-link-type="uri" xlink:href="https://github.com/s-andrews/FastQC">https://github.com/s-andrews/FastQC</ext-link> (accessed February 13, 2021).</citation>
</ref>
<ref id="B2">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Aramaki</surname> <given-names>T.</given-names></name> <name><surname>Blanc-Mathieu</surname> <given-names>R.</given-names></name> <name><surname>Endo</surname> <given-names>H.</given-names></name> <name><surname>Ohkubo</surname> <given-names>K.</given-names></name> <name><surname>Kanehisa</surname> <given-names>M.</given-names></name> <name><surname>Goto</surname> <given-names>S.</given-names></name> <etal/></person-group>. (<year>2019</year>). <article-title>KofamKOALA: KEGG Ortholog assignment based on profile HMM and adaptive score threshold</article-title>. <source>Bioinformatics</source> <volume>36</volume>, <fpage>2251</fpage>&#x02013;<lpage>2252</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btz859</pub-id><pub-id pub-id-type="pmid">31742321</pub-id></citation></ref>
<ref id="B3">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Benestan</surname> <given-names>L.</given-names></name></person-group> (<year>2020</year>). <article-title>Population genomics applied to fishery management and conservation,</article-title> in <source>Population Genomics: Marine Organisms</source>, eds <person-group person-group-type="editor"><name><surname>Oleksiak</surname> <given-names>M. F.</given-names></name> <name><surname>Rajora</surname> <given-names>O. P.</given-names></name></person-group>  (<publisher-loc>Cham</publisher-loc>: <publisher-name>Springer International Publishing</publisher-name>), <fpage>399</fpage>&#x02013;<lpage>421</lpage>. <pub-id pub-id-type="doi">10.1007/13836_2019_66</pub-id></citation>
</ref>
<ref id="B4">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bernal</surname> <given-names>D.</given-names></name> <name><surname>Brill</surname> <given-names>R. W.</given-names></name> <name><surname>Dickson</surname> <given-names>K. A.</given-names></name> <name><surname>Shiels</surname> <given-names>H. A.</given-names></name></person-group> (<year>2017</year>). <article-title>Sharing the water column: physiological mechanisms underlying species-specific habitat use in tunas</article-title>. <source>Rev. Fish Biol. Fish</source>. <volume>27</volume>, <fpage>843</fpage>&#x02013;<lpage>880</lpage>. <pub-id pub-id-type="doi">10.1007/s11160-017-9497-7</pub-id></citation>
</ref>
<ref id="B5">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bridson</surname> <given-names>P. B.</given-names></name> <name><surname>Stoner</surname> <given-names>J. M. S.</given-names></name> <name><surname>Fransen</surname> <given-names>M. H.</given-names></name> <name><surname>Ireland</surname> <given-names>J.</given-names></name></person-group> (<year>2020</year>). <article-title>The aquaculture sustainability continuum &#x02013; Defining an environmental performance framework</article-title>. <source>Environ. Sustain. Indic</source>. <volume>8</volume>:<fpage>100050</fpage>. <pub-id pub-id-type="doi">10.1016/j.indic.2020.100050</pub-id></citation>
</ref>
<ref id="B6">
<citation citation-type="web"><person-group person-group-type="author"><name><surname>Bushnell</surname> <given-names>B.</given-names></name></person-group> (<year>2014</year>). <source>BBMap Version 38.87</source>. Available online at: <ext-link ext-link-type="uri" xlink:href="https://sourceforge.net/projects/bbmap/">https://sourceforge.net/projects/bbmap/</ext-link> (accessed September 29, 2020).</citation>
</ref>
<ref id="B7">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Camacho</surname> <given-names>C.</given-names></name> <name><surname>Coulouris</surname> <given-names>G.</given-names></name> <name><surname>Avagyan</surname> <given-names>V.</given-names></name> <name><surname>Ma</surname> <given-names>N.</given-names></name> <name><surname>Papadopoulos</surname> <given-names>J.</given-names></name> <name><surname>Bealer</surname> <given-names>K.</given-names></name> <etal/></person-group>. (<year>2009</year>). <article-title>BLAST&#x0002B;: architecture and applications</article-title>. <source>BMC Bioinformatics</source> <volume>10</volume>:<fpage>421</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2105-10-421</pub-id><pub-id pub-id-type="pmid">20003500</pub-id></citation></ref>
<ref id="B8">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Capella-Guti&#x000E9;rrez</surname> <given-names>S.</given-names></name> <name><surname>Silla-Mart&#x000ED;nez</surname> <given-names>J. M.</given-names></name> <name><surname>Gabald&#x000F3;n</surname> <given-names>T.</given-names></name></person-group> (<year>2009</year>). <article-title>trimAl: a tool for automated alignment trimming in large-scale phylogenetic analyses</article-title>. <source>Bioinformatics (Oxford, England)</source> <volume>25</volume>, <fpage>1972</fpage>&#x02013;<lpage>1973</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btp348</pub-id><pub-id pub-id-type="pmid">19505945</pub-id></citation></ref>
<ref id="B9">
<citation citation-type="web"><person-group person-group-type="author"><name><surname>Card</surname> <given-names>D.</given-names></name></person-group> (<year>2017</year>). <source>Genome Annotation Using MAKER. 2017</source>. Available online at: <ext-link ext-link-type="uri" xlink:href="https://darencard.net/blog/2017-05-16-maker-genome-annotation/">https://darencard.net/blog/2017-05-16-maker-genome-annotation/</ext-link> (accessed September 23, 2020).</citation>
</ref>
<ref id="B10">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cartwright</surname> <given-names>D. A.</given-names></name> <name><surname>Troggio</surname> <given-names>M.</given-names></name> <name><surname>Velasco</surname> <given-names>R.</given-names></name> <name><surname>Gutin</surname> <given-names>A.</given-names></name></person-group> (<year>2007</year>). <article-title>Genetic mapping in the presence of genotyping errors</article-title>. <source>Genetics</source> <volume>176</volume>, <fpage>2521</fpage>&#x02013;<lpage>2527</lpage>. <pub-id pub-id-type="doi">10.1534/genetics.106.063982</pub-id><pub-id pub-id-type="pmid">17277374</pub-id></citation></ref>
<ref id="B11">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>C.</given-names></name> <name><surname>Chen</surname> <given-names>H.</given-names></name> <name><surname>Zhang</surname> <given-names>Y.</given-names></name> <name><surname>Thomas</surname> <given-names>H. R.</given-names></name> <name><surname>Frank</surname> <given-names>M. H.</given-names></name> <name><surname>He</surname> <given-names>Y.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>TBtools: an integrative toolkit developed for interactive analyses of big biological data</article-title>. <source>Mol. Plant</source> <volume>13</volume>, <fpage>1194</fpage>&#x02013;<lpage>1202</lpage>. <pub-id pub-id-type="doi">10.1016/j.molp.2020.06.009</pub-id><pub-id pub-id-type="pmid">32585190</pub-id></citation></ref>
<ref id="B12">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Collette</surname> <given-names>B.</given-names></name></person-group> (<year>2001</year>). <article-title>Tunas (also, albacore, bonitos, mackerels, seerfishes, and wahoo),</article-title> in <source>FAO Species Identification Guide for Fishery Purposes The Living Marine Resources of the Western Central Pacific</source>, eds <person-group person-group-type="editor"><name><surname>Carpenter</surname> <given-names>K. E.</given-names></name> <name><surname>Niem</surname> <given-names>V. H.</given-names></name></person-group> (<publisher-loc>Rome</publisher-loc>: <publisher-name>FAO</publisher-name>), <fpage>3721</fpage>&#x02013;<lpage>3735</lpage>.</citation>
</ref>
<ref id="B13">
<citation citation-type="web"><person-group person-group-type="author"><name><surname>Creevey</surname> <given-names>C.</given-names></name></person-group> (<year>2021</year>). <source>Catsequences Version 1.3</source>. Available online at: <ext-link ext-link-type="uri" xlink:href="https://github.com/ChrisCreevey/catsequences/tree/73c11ef">https://github.com/ChrisCreevey/catsequences/tree/73c11ef</ext-link> (accessed January 21, 2021).</citation>
</ref>
<ref id="B14">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Crescente</surname> <given-names>J. M.</given-names></name> <name><surname>Zavallo</surname> <given-names>D.</given-names></name> <name><surname>Helguera</surname> <given-names>M.</given-names></name> <name><surname>Vanzetti</surname> <given-names>L. S.</given-names></name></person-group> (<year>2018</year>). <article-title>MITE Tracker: an accurate approach to identify miniature inverted-repeat transposable elements in large genomes</article-title>. <source>BMC Bioinformatics</source> <volume>19</volume>:<fpage>348</fpage>. <pub-id pub-id-type="doi">10.1186/s12859-018-2376-y</pub-id><pub-id pub-id-type="pmid">30285604</pub-id></citation></ref>
<ref id="B15">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Danecek</surname> <given-names>P.</given-names></name> <name><surname>Auton</surname> <given-names>A.</given-names></name> <name><surname>Abecasis</surname> <given-names>G.</given-names></name> <name><surname>Albers</surname> <given-names>C. A.</given-names></name> <name><surname>Banks</surname> <given-names>E.</given-names></name> <name><surname>DePristo</surname> <given-names>M. A.</given-names></name> <etal/></person-group>. (<year>2011</year>). <article-title>The variant call format and VCFtools</article-title>. <source>Bioinformatics (Oxford, England)</source> <volume>27</volume>, <fpage>2156</fpage>&#x02013;<lpage>2158</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btr330</pub-id><pub-id pub-id-type="pmid">21653522</pub-id></citation></ref>
<ref id="B16">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Danecek</surname> <given-names>P.</given-names></name> <name><surname>Bonfield</surname> <given-names>J. K.</given-names></name> <name><surname>Liddle</surname> <given-names>J.</given-names></name> <name><surname>Marshall</surname> <given-names>J.</given-names></name> <name><surname>Ohan</surname> <given-names>V.</given-names></name> <name><surname>Pollard</surname> <given-names>M. O.</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>Twelve years of SAMtools and BCFtools</article-title>. <source>Gigascience</source> <volume>10</volume>:<fpage>giab008</fpage>. <pub-id pub-id-type="doi">10.1093/gigascience/giab008</pub-id><pub-id pub-id-type="pmid">33590861</pub-id></citation></ref>
<ref id="B17">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Davidson</surname> <given-names>N. M.</given-names></name> <name><surname>Hawkins</surname> <given-names>A. D. K.</given-names></name> <name><surname>Oshlack</surname> <given-names>A.</given-names></name></person-group> (<year>2017</year>). <article-title>SuperTranscripts: a data driven reference for analysis and visualisation of transcriptomes</article-title>. <source>Genome Biol</source>. <volume>18</volume>:<fpage>148</fpage>. <pub-id pub-id-type="doi">10.1186/s13059-017-1284-1</pub-id><pub-id pub-id-type="pmid">28836999</pub-id></citation></ref>
<ref id="B18">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dickson</surname> <given-names>K. A.</given-names></name> <name><surname>Johnson</surname> <given-names>N. M.</given-names></name> <name><surname>Donley</surname> <given-names>J. M.</given-names></name> <name><surname>Hoskinson</surname> <given-names>J. A.</given-names></name> <name><surname>Hansen</surname> <given-names>M. W.</given-names></name> <name><surname>Tessier</surname> <given-names>J. D. S.</given-names></name></person-group> (<year>2000</year>). <article-title>Ontogenetic changes in characteristics required for endothermy in juvenile black skipjack tuna (<italic>Euthynnus lineatus</italic>)</article-title>. <source>J. Exp. Biol</source>. <volume>203</volume>, <fpage>3077</fpage>&#x02013;<lpage>3087</lpage>. <pub-id pub-id-type="doi">10.1242/jeb.203.20.3077</pub-id><pub-id pub-id-type="pmid">11003819</pub-id></citation></ref>
<ref id="B19">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Donley</surname> <given-names>J. M.</given-names></name> <name><surname>Dickson</surname> <given-names>K. A.</given-names></name></person-group> (<year>2000</year>). <article-title>Swimming kinematics of juvenile kawakawa tuna (<italic>Euthynnus affinis</italic>) and chub mackerel (<italic>Scomber japonicus</italic>)</article-title>. <source>J. Exp. Biol</source>. <volume>203</volume>, <fpage>3103</fpage>&#x02013;<lpage>3116</lpage>. <pub-id pub-id-type="doi">10.1242/jeb.203.20.3103</pub-id><pub-id pub-id-type="pmid">11003821</pub-id></citation></ref>
<ref id="B20">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Du</surname> <given-names>K.</given-names></name> <name><surname>St&#x000F6;ck</surname> <given-names>M.</given-names></name> <name><surname>Kneitz</surname> <given-names>S.</given-names></name> <name><surname>Klopp</surname> <given-names>C.</given-names></name> <name><surname>Woltering</surname> <given-names>J. M.</given-names></name> <name><surname>Adolfi</surname> <given-names>M. C.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>The sterlet sturgeon genome sequence and the mechanisms of segmental rediploidization</article-title>. <source>Nat. Ecol. Evol</source>. <volume>4</volume>, <fpage>841</fpage>&#x02013;<lpage>852</lpage>. <pub-id pub-id-type="doi">10.1038/s41559-020-1166-x</pub-id><pub-id pub-id-type="pmid">32231327</pub-id></citation></ref>
<ref id="B21">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Emms</surname> <given-names>D. M.</given-names></name> <name><surname>Kelly</surname> <given-names>S.</given-names></name></person-group> (<year>2015</year>). <article-title>OrthoFinder: solving fundamental biases in whole genome comparisons dramatically improves orthogroup inference accuracy</article-title>. <source>Genome Biol</source>. <volume>16</volume>:<fpage>157</fpage>. <pub-id pub-id-type="doi">10.1186/s13059-015-0721-2</pub-id><pub-id pub-id-type="pmid">26243257</pub-id></citation></ref>
<ref id="B22">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>English</surname> <given-names>A. C.</given-names></name> <name><surname>Richards</surname> <given-names>S.</given-names></name> <name><surname>Han</surname> <given-names>Y.</given-names></name> <name><surname>Wang</surname> <given-names>M.</given-names></name> <name><surname>Vee</surname> <given-names>V.</given-names></name> <name><surname>Qu</surname> <given-names>J.</given-names></name> <etal/></person-group>. (<year>2012</year>). <article-title>Mind the gap: upgrading genomes with Pacific Biosciences RS long-read sequencing technology</article-title>. <source>PLoS ONE</source> <volume>7</volume>:<fpage>e47768</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0047768</pub-id><pub-id pub-id-type="pmid">23185243</pub-id></citation></ref>
<ref id="B23">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Flynn</surname> <given-names>J. M.</given-names></name> <name><surname>Hubley</surname> <given-names>R.</given-names></name> <name><surname>Goubert</surname> <given-names>C.</given-names></name> <name><surname>Rosen</surname> <given-names>J.</given-names></name> <name><surname>Clark</surname> <given-names>A. G.</given-names></name> <name><surname>Feschotte</surname> <given-names>C.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>RepeatModeler2 for automated genomic discovery of transposable element families</article-title>. <source>Proc. Natl. Acad. Sci</source>. <volume>117</volume>, <fpage>9451</fpage>&#x02013;<lpage>9457</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1921046117</pub-id><pub-id pub-id-type="pmid">32300014</pub-id></citation></ref>
<ref id="B24">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Friedman</surname> <given-names>M.</given-names></name> <name><surname>Feilich</surname> <given-names>K. L.</given-names></name> <name><surname>Beckett</surname> <given-names>H. T.</given-names></name> <name><surname>Alfaro</surname> <given-names>M. E.</given-names></name> <name><surname>Faircloth</surname> <given-names>B. C.</given-names></name> <name><surname>Cern&#x000FD;</surname> <given-names>D.</given-names></name> <etal/></person-group>. (<year>2019</year>). <article-title>A phylogenomic framework for pelagiarian fishes (Acanthomorpha: Percomorpha) highlights mosaic radiation in the open ocean</article-title>. <source>Proc. Biol. Sci</source>. <volume>286</volume>:<fpage>20191502</fpage>. <pub-id pub-id-type="doi">10.1098/rspb.2019.1502</pub-id><pub-id pub-id-type="pmid">31506051</pub-id></citation></ref>
<ref id="B25">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Grabherr</surname> <given-names>M. G.</given-names></name> <name><surname>Haas</surname> <given-names>B. J.</given-names></name> <name><surname>Yassour</surname> <given-names>M.</given-names></name> <name><surname>Levin</surname> <given-names>J. Z.</given-names></name> <name><surname>Thompson</surname> <given-names>D. A.</given-names></name> <name><surname>Amit</surname> <given-names>I.</given-names></name> <etal/></person-group>. (<year>2011</year>). <article-title>Full-length transcriptome assembly from RNA-Seq data without a reference genome</article-title>. <source>Nat. Biotechnol</source>. <volume>29</volume>, <fpage>644</fpage>&#x02013;<lpage>652</lpage>. <pub-id pub-id-type="doi">10.1038/nbt.1883</pub-id><pub-id pub-id-type="pmid">21572440</pub-id></citation></ref>
<ref id="B26">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Griffiths</surname> <given-names>S. P.</given-names></name> <name><surname>Kuhnert</surname> <given-names>P. M.</given-names></name> <name><surname>Fry</surname> <given-names>G. F.</given-names></name> <name><surname>Manson</surname> <given-names>F. J.</given-names></name></person-group> (<year>2009</year>). <article-title>Temporal and size-related variation in the diet, consumption rate, and daily ration of mackerel tuna (<italic>Euthynnus affinis</italic>) in neritic waters of eastern Australia</article-title>. <source>ICES J. Marine Sci</source>. <volume>66</volume>, <fpage>720</fpage>&#x02013;<lpage>733</lpage>. <pub-id pub-id-type="doi">10.1093/icesjms/fsp065</pub-id></citation>
</ref>
<ref id="B27">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Guindon</surname> <given-names>S.</given-names></name> <name><surname>Dufayard</surname> <given-names>J.-F.</given-names></name> <name><surname>Lefort</surname> <given-names>V.</given-names></name> <name><surname>Anisimova</surname> <given-names>M.</given-names></name> <name><surname>Hordijk</surname> <given-names>W.</given-names></name> <name><surname>Gascuel</surname> <given-names>O.</given-names></name></person-group> (<year>2010</year>). <article-title>New algorithms and methods to estimate maximum-likelihood phylogenies: assessing the performance of PhyML 3.0</article-title>. <source>Syst. Biol</source>. <volume>59</volume>, <fpage>307</fpage>&#x02013;<lpage>321</lpage>. <pub-id pub-id-type="doi">10.1093/sysbio/syq010</pub-id><pub-id pub-id-type="pmid">20525638</pub-id></citation></ref>
<ref id="B28">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hara</surname> <given-names>Y.</given-names></name> <name><surname>Tatsumi</surname> <given-names>K.</given-names></name> <name><surname>Yoshida</surname> <given-names>M.</given-names></name> <name><surname>Kajikawa</surname> <given-names>E.</given-names></name> <name><surname>Kiyonari</surname> <given-names>H.</given-names></name> <name><surname>Kuraku</surname> <given-names>S.</given-names></name></person-group> (<year>2015</year>). <article-title>Optimizing and benchmarking de novo transcriptome sequencing: from library preparation to assembly evaluation</article-title>. <source>BMC Genomics</source> <volume>16</volume>:<fpage>977</fpage>. <pub-id pub-id-type="doi">10.1186/s12864-015-2007-1</pub-id><pub-id pub-id-type="pmid">26581708</pub-id></citation></ref>
<ref id="B29">
<citation citation-type="thesis"><person-group person-group-type="author"><name><surname>Harris</surname> <given-names>R. S.</given-names></name></person-group> (<year>2007</year>). <source>Improved pairwise alignment of genomic DNA</source> (Disertation thesis). The Pennsylvania State University, United States, State College, PA.</citation>
</ref>
<ref id="B30">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hoang</surname> <given-names>D. T.</given-names></name> <name><surname>Chernomor</surname> <given-names>O.</given-names></name> <name><surname>von Haeseler</surname> <given-names>A.</given-names></name> <name><surname>Minh</surname> <given-names>B. Q.</given-names></name> <name><surname>Vinh</surname> <given-names>L. S.</given-names></name></person-group> (<year>2018</year>). <article-title>UFBoot2: Improving the Ultrafast Bootstrap approximation</article-title>. <source>Mol. Biol. Evol</source>. <volume>35</volume>, <fpage>518</fpage>&#x02013;<lpage>522</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msx281</pub-id><pub-id pub-id-type="pmid">29077904</pub-id></citation></ref>
<ref id="B31">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Holt</surname> <given-names>C.</given-names></name> <name><surname>Yandell</surname> <given-names>M.</given-names></name></person-group> (<year>2011</year>). <article-title>MAKER2: an annotation pipeline and genome-database management tool for second-generation genome projects</article-title>. <source>BMC Bioinformatics</source> <volume>12</volume>:<fpage>491</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2105-12-491</pub-id><pub-id pub-id-type="pmid">22192575</pub-id></citation></ref>
<ref id="B32">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hosoya</surname> <given-names>S.</given-names></name> <name><surname>Hirase</surname> <given-names>S.</given-names></name> <name><surname>Kikuchi</surname> <given-names>K.</given-names></name> <name><surname>Nanjo</surname> <given-names>K.</given-names></name> <name><surname>Nakamura</surname> <given-names>Y.</given-names></name> <name><surname>Kohno</surname> <given-names>H.</given-names></name> <etal/></person-group>. (<year>2019</year>). <article-title>Random PCR-based genotyping by sequencing technology GRAS-Di (genotyping by random amplicon sequencing, direct) reveals genetic structure of mangrove fishes</article-title>. <source>Mol. Ecol. Resour</source>. <volume>19</volume>, <fpage>1153</fpage>&#x02013;<lpage>1163</lpage>. <pub-id pub-id-type="doi">10.1111/1755-0998.13025</pub-id><pub-id pub-id-type="pmid">31009151</pub-id></citation></ref>
<ref id="B33">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hughes</surname> <given-names>L. C.</given-names></name> <name><surname>Ort&#x000ED;</surname> <given-names>G.</given-names></name> <name><surname>Huang</surname> <given-names>Y.</given-names></name> <name><surname>Sun</surname> <given-names>Y.</given-names></name> <name><surname>Baldwin</surname> <given-names>C. C.</given-names></name> <name><surname>Thompson</surname> <given-names>A. W.</given-names></name> <etal/></person-group>. (<year>2018</year>). <article-title>Comprehensive phylogeny of ray-finned fishes (Actinopterygii) based on transcriptomic and genomic data</article-title>. <source>Proc. Natl. Acad. Sci</source>. <volume>115</volume>, <fpage>6249</fpage>&#x02013;<lpage>6254</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1719358115</pub-id><pub-id pub-id-type="pmid">29760103</pub-id></citation></ref>
<ref id="B34">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jones</surname> <given-names>P.</given-names></name> <name><surname>Binns</surname> <given-names>D.</given-names></name> <name><surname>Chang</surname> <given-names>H. Y.</given-names></name> <name><surname>Fraser</surname> <given-names>M.</given-names></name> <name><surname>Li</surname> <given-names>W.</given-names></name> <name><surname>McAnulla</surname> <given-names>C.</given-names></name> <etal/></person-group>. (<year>2014</year>). <article-title>InterProScan 5: genome-scale protein function classification</article-title>. <source>Bioinformatics (Oxford, England)</source> <volume>30</volume>, <fpage>1236</fpage>&#x02013;<lpage>1240</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btu031</pub-id><pub-id pub-id-type="pmid">24451626</pub-id></citation></ref>
<ref id="B35">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kalyaanamoorthy</surname> <given-names>S.</given-names></name> <name><surname>Minh</surname> <given-names>B. Q.</given-names></name> <name><surname>Wong</surname> <given-names>T. K. F.</given-names></name> <name><surname>von Haeseler</surname> <given-names>A.</given-names></name> <name><surname>Jermiin</surname> <given-names>L. S.</given-names></name></person-group> (<year>2017</year>). <article-title>ModelFinder: fast model selection for accurate phylogenetic estimates</article-title>. <source>Nat. Methods</source> <volume>14</volume>, <fpage>587</fpage>&#x02013;<lpage>589</lpage>. <pub-id pub-id-type="doi">10.1038/nmeth.4285</pub-id><pub-id pub-id-type="pmid">28481363</pub-id></citation></ref>
<ref id="B36">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Katoh</surname> <given-names>K.</given-names></name> <name><surname>Standley</surname> <given-names>D. M.</given-names></name></person-group> (<year>2013</year>). <article-title>MAFFT multiple sequence alignment software version 7: improvements in performance and usability</article-title>. <source>Mol. Biol. Evol</source>. <volume>30</volume>, <fpage>772</fpage>&#x02013;<lpage>780</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/mst010</pub-id><pub-id pub-id-type="pmid">23329690</pub-id></citation></ref>
<ref id="B37">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kerkvliet</surname> <given-names>J.</given-names></name> <name><surname>de Fouchier</surname> <given-names>A.</given-names></name> <name><surname>van Wijk</surname> <given-names>M.</given-names></name> <name><surname>Groot</surname> <given-names>A. T.</given-names></name></person-group> (<year>2019</year>). <article-title>The Bellerophon pipeline, improving de novo transcriptomes and removing chimeras</article-title>. <source>Ecol. Evol</source>. <volume>9</volume>, <fpage>10513</fpage>&#x02013;<lpage>10521</lpage>. <pub-id pub-id-type="doi">10.1002/ece3.5571</pub-id><pub-id pub-id-type="pmid">31624564</pub-id></citation></ref>
<ref id="B38">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Korf</surname> <given-names>I.</given-names></name></person-group> (<year>2004</year>). <article-title>Gene finding in novel genomes</article-title>. <source>BMC Bioinformatics</source> <volume>5</volume>:<fpage>59</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2105-5-59</pub-id><pub-id pub-id-type="pmid">15144565</pub-id></citation></ref>
<ref id="B39">
<citation citation-type="web"><person-group person-group-type="author"><name><surname>Krueger</surname> <given-names>F.</given-names></name></person-group> (<year>2019</year>). <source>TrimGalore Version 0.6.4</source>. Available online at: <ext-link ext-link-type="uri" xlink:href="https://github.com/FelixKrueger/TrimGalore">https://github.com/FelixKrueger/TrimGalore</ext-link> (accessed March 1, 2021).</citation>
</ref>
<ref id="B40">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kumar</surname> <given-names>S.</given-names></name> <name><surname>Stecher</surname> <given-names>G.</given-names></name> <name><surname>Suleski</surname> <given-names>M.</given-names></name> <name><surname>Hedges</surname> <given-names>S. B.</given-names></name></person-group> (<year>2017</year>). <article-title>TimeTree: a resource for timelines, timetrees, and divergence times</article-title>. <source>Mol. Biol. Evol</source>. <volume>34</volume>, <fpage>1812</fpage>&#x02013;<lpage>1819</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msx116</pub-id><pub-id pub-id-type="pmid">28387841</pub-id></citation></ref>
<ref id="B41">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Langmead</surname> <given-names>B.</given-names></name> <name><surname>Salzberg</surname> <given-names>S. L.</given-names></name></person-group> (<year>2012</year>). <article-title>Fast gapped-read alignment with Bowtie 2</article-title>. <source>Nat. Methods</source> <volume>9</volume>, <fpage>357</fpage>&#x02013;<lpage>359</lpage>. <pub-id pub-id-type="doi">10.1038/nmeth.1923</pub-id><pub-id pub-id-type="pmid">22388286</pub-id></citation></ref>
<ref id="B42">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>H.</given-names></name> <name><surname>Durbin</surname> <given-names>R.</given-names></name></person-group> (<year>2009</year>). <article-title>Fast and accurate short read alignment with Burrows-Wheeler transform</article-title>. <source>Bioinformatics (Oxford, England)</source> <volume>25</volume>, <fpage>1754</fpage>&#x02013;<lpage>1760</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btp324</pub-id><pub-id pub-id-type="pmid">19451168</pub-id></citation></ref>
<ref id="B43">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>W.</given-names></name> <name><surname>Godzik</surname> <given-names>A.</given-names></name></person-group> (<year>2006</year>). <article-title>Cd-hit: a fast program for clustering and comparing large sets of protein or nucleotide sequences</article-title>. <source>Bioinformatics (Oxford, England)</source> <volume>22</volume>, <fpage>1658</fpage>&#x02013;<lpage>1659</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btl158</pub-id><pub-id pub-id-type="pmid">16731699</pub-id></citation></ref>
<ref id="B44">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lien</surname> <given-names>S.</given-names></name> <name><surname>Koop</surname> <given-names>B. F.</given-names></name> <name><surname>Sandve</surname> <given-names>S. R.</given-names></name> <name><surname>Miller</surname> <given-names>J. R.</given-names></name> <name><surname>Kent</surname> <given-names>M. P.</given-names></name> <name><surname>Nome</surname> <given-names>T.</given-names></name> <etal/></person-group>. (<year>2016</year>). <article-title>The Atlantic salmon genome provides insights into rediploidization</article-title>. <source>Nature</source> <volume>533</volume>, <fpage>200</fpage>&#x02013;<lpage>205</lpage>. <pub-id pub-id-type="doi">10.1038/nature17164</pub-id><pub-id pub-id-type="pmid">27088604</pub-id></citation></ref>
<ref id="B45">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lu</surname> <given-names>G.</given-names></name> <name><surname>Luo</surname> <given-names>M.</given-names></name></person-group> (<year>2020</year>). <article-title>Genomes of major fishes in world fisheries and aquaculture: Status, application and perspective</article-title>. <source>Aquacult. Fish</source>. <volume>5</volume>, <fpage>163</fpage>&#x02013;<lpage>173</lpage>. <pub-id pub-id-type="doi">10.1016/j.aaf.2020.05.004</pub-id></citation>
</ref>
<ref id="B46">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mar&#x000E7;ais</surname> <given-names>G.</given-names></name> <name><surname>Kingsford</surname> <given-names>C.</given-names></name></person-group> (<year>2011</year>). <article-title>A fast, lock-free approach for efficient parallel counting of occurrences of k-mers</article-title>. <source>Bioinformatics (Oxford, England)</source> <volume>27</volume>, <fpage>764</fpage>&#x02013;<lpage>770</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btr011</pub-id><pub-id pub-id-type="pmid">21217122</pub-id></citation></ref>
<ref id="B47">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mukundan</surname> <given-names>M. K.</given-names></name> <name><surname>Arul</surname> <given-names>J. M.</given-names></name> <name><surname>Radhakrishnan</surname> <given-names>A. G.</given-names></name> <name><surname>Antony</surname> <given-names>P. D.</given-names></name></person-group> (<year>1979</year>). <article-title>Red and white meat of tune (<italic>Euthynnus affinis</italic>); their biochemical role and nutritional quality. Fish</article-title>. <source>Technol</source>. <volume>16</volume>, <fpage>72</fpage>&#x02013;<lpage>82</lpage>.</citation>
</ref>
<ref id="B48">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nguyen</surname> <given-names>L. T.</given-names></name> <name><surname>Schmidt</surname> <given-names>H. A.</given-names></name> <name><surname>von Haeseler</surname> <given-names>A.</given-names></name> <name><surname>Minh</surname> <given-names>B. Q.</given-names></name></person-group> (<year>2015</year>). <article-title>IQ-TREE: a fast and effective stochastic algorithm for estimating maximum-likelihood phylogenies</article-title>. <source>Mol. Biol. Evol</source>. <volume>32</volume>, <fpage>268</fpage>&#x02013;<lpage>274</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msu300</pub-id><pub-id pub-id-type="pmid">25371430</pub-id></citation></ref>
<ref id="B49">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nishimura</surname> <given-names>O.</given-names></name> <name><surname>Hara</surname> <given-names>Y.</given-names></name> <name><surname>Kuraku</surname> <given-names>S.</given-names></name></person-group> (<year>2017</year>). <article-title>gVolante for standardizing completeness assessment of genome and transcriptome assemblies</article-title>. <source>Bioinformatics (Oxford, England)</source> <volume>33</volume>, <fpage>3635</fpage>&#x02013;<lpage>3637</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btx445</pub-id><pub-id pub-id-type="pmid">29036533</pub-id></citation></ref>
<ref id="B50">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>O&#x00027;Leary</surname> <given-names>N. A.</given-names></name> <name><surname>Wright</surname> <given-names>M. W.</given-names></name> <name><surname>Brister</surname> <given-names>J. R.</given-names></name> <name><surname>Ciufo</surname> <given-names>S.</given-names></name> <name><surname>Haddad</surname> <given-names>D.</given-names></name> <name><surname>McVeigh</surname> <given-names>R.</given-names></name> <etal/></person-group>. (<year>2016</year>). <article-title>Reference sequence (RefSeq) database at NCBI: current status, taxonomic expansion, and functional annotation</article-title>. <source>Nucleic Acids Res</source>. <volume>44</volume>, <fpage>D733</fpage>&#x02013;<lpage>745</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkv1189</pub-id><pub-id pub-id-type="pmid">26553804</pub-id></citation></ref>
<ref id="B51">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Quast</surname> <given-names>C.</given-names></name> <name><surname>Pruesse</surname> <given-names>E.</given-names></name> <name><surname>Yilmaz</surname> <given-names>P.</given-names></name> <name><surname>Gerken</surname> <given-names>J.</given-names></name> <name><surname>Schweer</surname> <given-names>T.</given-names></name> <name><surname>Yarza</surname> <given-names>P.</given-names></name> <etal/></person-group>. (<year>2012</year>). <article-title>The SILVA ribosomal RNA gene database project: improved data processing and web-based tools</article-title>. <source>Nucleic Acids Res</source>. <volume>41</volume>, <fpage>D590</fpage>&#x02013;<lpage>D596</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gks1219</pub-id><pub-id pub-id-type="pmid">23193283</pub-id></citation></ref>
<ref id="B52">
<citation citation-type="web"><person-group person-group-type="author"><name><surname>Rambaut</surname> <given-names>A.</given-names></name></person-group> (<year>2018</year>). <source>FigTree Version 1.4.4</source>. Available online at: <ext-link ext-link-type="uri" xlink:href="https://github.com/rambaut/figtree">https://github.com/rambaut/figtree</ext-link> (accessed April 19, 2021).</citation>
</ref>
<ref id="B53">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Saito</surname> <given-names>H.</given-names></name> <name><surname>Yamashiro</surname> <given-names>R.</given-names></name> <name><surname>Ishihara</surname> <given-names>K.</given-names></name> <name><surname>Xue</surname> <given-names>C.</given-names></name></person-group> (<year>1999</year>). <article-title>Lipids of three highly migratory fishes: <italic>Euthynnus affinis, Sarda orientalis</italic>, and <italic>Elagatis bipinnulata</italic></article-title>. <source>Biosci. Biotechnol. Biochem</source>. <volume>63</volume>, <fpage>2028</fpage>&#x02013;<lpage>2030</lpage>. <pub-id pub-id-type="doi">10.1271/bbb.63.2028</pub-id></citation>
</ref>
<ref id="B54">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sanciangco</surname> <given-names>M. D.</given-names></name> <name><surname>Carpenter</surname> <given-names>K. E.</given-names></name> <name><surname>Betancur</surname> <given-names>-R R</given-names></name></person-group>. (<year>2016</year>). <article-title>Phylogenetic placement of enigmatic percomorph families (Teleostei: Percomorphaceae)</article-title>. <source>Mol. Phylogen. Evol</source>. <volume>94</volume>, <fpage>565</fpage>&#x02013;<lpage>576</lpage>. <pub-id pub-id-type="doi">10.1016/j.ympev.2015.10.006</pub-id><pub-id pub-id-type="pmid">26493227</pub-id></citation></ref>
<ref id="B55">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Simao</surname> <given-names>F. A.</given-names></name> <name><surname>Waterhouse</surname> <given-names>R. M.</given-names></name> <name><surname>Ioannidis</surname> <given-names>P.</given-names></name> <name><surname>Kriventseva</surname> <given-names>E. V.</given-names></name> <name><surname>Zdobnov</surname> <given-names>E. M.</given-names></name></person-group> (<year>2015</year>). <article-title>BUSCO: assessing genome assembly and annotation completeness with single-copy orthologs</article-title>. <source>Bioinformatics (Oxford, England)</source> <volume>31</volume>, <fpage>3210</fpage>&#x02013;<lpage>3212</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btv351</pub-id><pub-id pub-id-type="pmid">26059717</pub-id></citation></ref>
<ref id="B56">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Slater</surname> <given-names>G. S.</given-names></name> <name><surname>Birney</surname> <given-names>E.</given-names></name></person-group> (<year>2005</year>). <article-title>Automated generation of heuristics for biological sequence comparison</article-title>. <source>BMC Bioinformatics</source> <volume>6</volume>:<fpage>31</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2105-6-31</pub-id><pub-id pub-id-type="pmid">15713233</pub-id></citation></ref>
<ref id="B57">
<citation citation-type="web"><person-group person-group-type="author"><name><surname>Smit</surname> <given-names>A. F. A.</given-names></name> <name><surname>Hubley</surname> <given-names>R.</given-names></name> <name><surname>Green</surname> <given-names>P.</given-names></name></person-group> (<year>2015</year>). <source>RepeatMasker Open-4.0</source>. Available online at: <ext-link ext-link-type="uri" xlink:href="http://www.repeatmasker.org">http://www.repeatmasker.org</ext-link> (accessed May 1, 2020).</citation>
</ref>
<ref id="B58">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Song</surname> <given-names>L.</given-names></name> <name><surname>Florea</surname> <given-names>L.</given-names></name></person-group> (<year>2015</year>). <article-title>Rcorrector: efficient and accurate error correction for Illumina RNA-seq reads</article-title>. <source>GigaScience</source> <volume>4</volume>:<fpage>48</fpage>. <pub-id pub-id-type="doi">10.1186/s13742-015-0089-y</pub-id><pub-id pub-id-type="pmid">26500767</pub-id></citation></ref>
<ref id="B59">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Stanke</surname> <given-names>M.</given-names></name> <name><surname>Waack</surname> <given-names>S.</given-names></name></person-group> (<year>2003</year>). <article-title>Gene prediction with a hidden Markov model and a new intron submodel</article-title>. <source>Bioinformatics (Oxford, England)</source> <volume>19</volume>(<supplement>Suppl. 2</supplement>), <fpage>ii215</fpage>&#x02013;<lpage>ii225</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btg1080</pub-id><pub-id pub-id-type="pmid">14534192</pub-id></citation></ref>
<ref id="B60">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Storer</surname> <given-names>J.</given-names></name> <name><surname>Hubley</surname> <given-names>R.</given-names></name> <name><surname>Rosen</surname> <given-names>J.</given-names></name> <name><surname>Wheeler</surname> <given-names>T. J.</given-names></name> <name><surname>Smit</surname> <given-names>A. F.</given-names></name></person-group> (<year>2021</year>). <article-title>The Dfam community resource of transposable element families, sequence models, and genome annotations</article-title>. <source>Mobile DNA</source> <volume>12</volume>:<fpage>2</fpage>. <pub-id pub-id-type="doi">10.1186/s13100-020-00230-y</pub-id><pub-id pub-id-type="pmid">33436076</pub-id></citation></ref>
<ref id="B61">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Suda</surname> <given-names>A.</given-names></name> <name><surname>Nishiki</surname> <given-names>I.</given-names></name> <name><surname>Iwasaki</surname> <given-names>Y.</given-names></name> <name><surname>Matsuura</surname> <given-names>A.</given-names></name> <name><surname>Akita</surname> <given-names>T.</given-names></name> <name><surname>Suzuki</surname> <given-names>N.</given-names></name> <etal/></person-group>. (<year>2019</year>). <article-title>Improvement of the Pacific bluefin tuna (<italic>Thunnus orientalis</italic>) reference genome and development of male-specific DNA markers</article-title>. <source>Sci. Rep</source>. <volume>9</volume>:<fpage>14450</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-019-50978-4</pub-id><pub-id pub-id-type="pmid">31595011</pub-id></citation></ref>
<ref id="B62">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tang</surname> <given-names>H.</given-names></name> <name><surname>Zhang</surname> <given-names>X.</given-names></name> <name><surname>Miao</surname> <given-names>C.</given-names></name> <name><surname>Zhang</surname> <given-names>J.</given-names></name> <name><surname>Ming</surname> <given-names>R.</given-names></name> <name><surname>Schnable</surname> <given-names>J. C.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>ALLMAPS: robust scaffold ordering based on multiple maps</article-title>. <source>Genome Biol</source>. <volume>16</volume>:<fpage>3</fpage>. <pub-id pub-id-type="doi">10.1186/s13059-014-0573-1</pub-id><pub-id pub-id-type="pmid">25583564</pub-id></citation></ref>
<ref id="B63">
<citation citation-type="web"><person-group person-group-type="author"><name><surname>Taranto</surname> <given-names>A.</given-names></name></person-group> (<year>2017</year>). <source>Yanagiba Version 1.0.0</source>. Available online at: <ext-link ext-link-type="uri" xlink:href="https://github.com/Adamtaranto/Yanagiba">https://github.com/Adamtaranto/Yanagiba</ext-link> (accessed December 19, 2019).</citation>
</ref>
<ref id="B64">
<citation citation-type="journal"><person-group person-group-type="author"><collab>The UniProt Consortium</collab></person-group> (<year>2021</year>). <article-title>UniProt: the universal protein knowledgebase in 2021</article-title>. <source>Nucleic Acids Res</source>. <volume>49</volume>, <fpage>D480</fpage>&#x02013;<lpage>D489</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkaa1100</pub-id><pub-id pub-id-type="pmid">33237286</pub-id></citation></ref>
<ref id="B65">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Toll-Riera</surname> <given-names>M.</given-names></name> <name><surname>Rad&#x000F3;-Trilla</surname> <given-names>N.</given-names></name> <name><surname>Martys</surname> <given-names>F.</given-names></name> <name><surname>Alb,&#x000E0;</surname> <given-names>M. M.</given-names></name></person-group> (<year>2011</year>). <article-title>Role of low-complexity sequences in the formation of novel protein coding sequences</article-title>. <source>Mol. Biol. Evol</source>. <volume>29</volume>, <fpage>883</fpage>&#x02013;<lpage>886</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msr263</pub-id><pub-id pub-id-type="pmid">22045997</pub-id></citation></ref>
<ref id="B66">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Vurture</surname> <given-names>G. W.</given-names></name> <name><surname>Sedlazeck</surname> <given-names>F. J.</given-names></name> <name><surname>Nattestad</surname> <given-names>M.</given-names></name> <name><surname>Underwood</surname> <given-names>C. J.</given-names></name> <name><surname>Fang</surname> <given-names>H.</given-names></name> <name><surname>Gurtowski</surname> <given-names>J.</given-names></name> <etal/></person-group>. (<year>2017</year>). <article-title>GenomeScope: fast reference-free genome profiling from short reads</article-title>. <source>Bioinformatics (Oxford, England)</source> <volume>33</volume>, <fpage>2202</fpage>&#x02013;<lpage>2204</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btx153</pub-id><pub-id pub-id-type="pmid">28369201</pub-id></citation></ref>
<ref id="B67">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Wickham</surname> <given-names>H.</given-names></name></person-group> (<year>2016</year>). <source>ggplot2: Elegant Graphics for Data Analysis</source>. <publisher-loc>New York, NY</publisher-loc>: <publisher-name>Springer International Publishing</publisher-name>. <pub-id pub-id-type="doi">10.1007/978-3-319-24277-4</pub-id></citation>
</ref>
<ref id="B68">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname> <given-names>Z.</given-names></name></person-group> (<year>1997</year>). <article-title>PAML: a program package for phylogenetic analysis by maximum likelihood</article-title>. <source>Comput. Appl. Biosci.</source> <volume>13</volume>, <fpage>555</fpage>&#x02013;<lpage>556</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/13.5.555</pub-id><pub-id pub-id-type="pmid">9367129</pub-id></citation></ref>
<ref id="B69">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yasuike</surname> <given-names>M.</given-names></name> <name><surname>Fujiwara</surname> <given-names>A.</given-names></name> <name><surname>Nakamura</surname> <given-names>Y.</given-names></name> <name><surname>Iwasaki</surname> <given-names>Y.</given-names></name> <name><surname>Nishiki</surname> <given-names>I.</given-names></name> <name><surname>Sugaya</surname> <given-names>T.</given-names></name> <etal/></person-group>. (<year>2016</year>). <article-title>A functional genomics tool for the Pacific bluefin tuna: development of a 44K oligonucleotide microarray from whole-genome sequencing data for global transcriptome analysis</article-title>. <source>Gene</source> <volume>576</volume>(<issue>2 Pt 1</issue>), <fpage>603</fpage>&#x02013;<lpage>609</lpage>. <pub-id pub-id-type="doi">10.1016/j.gene.2015.10.023</pub-id><pub-id pub-id-type="pmid">26477480</pub-id></citation></ref>
<ref id="B70">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yates</surname> <given-names>A. D.</given-names></name> <name><surname>Achuthan</surname> <given-names>P.</given-names></name> <name><surname>Akanni</surname> <given-names>W.</given-names></name> <name><surname>Allen</surname> <given-names>J.</given-names></name> <name><surname>Allen</surname> <given-names>J.</given-names></name> <name><surname>Alvarez-Jarreta</surname> <given-names>J.</given-names></name> <etal/></person-group>. (<year>2019</year>). <article-title>Ensembl 2020</article-title>. <source>Nucleic Acids Res</source>. <volume>48</volume>, <fpage>D682</fpage>&#x02013;<lpage>D688</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkz966</pub-id><pub-id pub-id-type="pmid">31691826</pub-id></citation></ref>
<ref id="B71">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yazawa</surname> <given-names>R.</given-names></name> <name><surname>Takeuchi</surname> <given-names>Y.</given-names></name> <name><surname>Amezawa</surname> <given-names>K.</given-names></name> <name><surname>Sato</surname> <given-names>K.</given-names></name> <name><surname>Iwata</surname> <given-names>G.</given-names></name> <name><surname>Kabeya</surname> <given-names>N.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>GnRHa-induced spawning of the Eastern little tuna (<italic>Euthynnus affinis</italic>) in a 70-m3 land-based tank</article-title>. <source>Aquaculture</source> <volume>442</volume>, <fpage>58</fpage>&#x02013;<lpage>68</lpage>. <pub-id pub-id-type="doi">10.1016/j.aquaculture.2015.01.016</pub-id></citation>
</ref>
<ref id="B72">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yazawa</surname> <given-names>R.</given-names></name> <name><surname>Takeuchi</surname> <given-names>Y.</given-names></name> <name><surname>Satoh</surname> <given-names>K.</given-names></name> <name><surname>Machida</surname> <given-names>Y.</given-names></name> <name><surname>Amezawa</surname> <given-names>K.</given-names></name> <name><surname>Kabeya</surname> <given-names>N.</given-names></name> <etal/></person-group>. (<year>2016</year>). <article-title>Eastern little tuna, <italic>Euthynnus affinis</italic> (Cantor, 1849) mature and reproduce within 1 year of rearing in land-based tanks</article-title>. <source>Aquacult. Res</source>. <volume>47</volume>, <fpage>3800</fpage>&#x02013;<lpage>3810</lpage>. <pub-id pub-id-type="doi">10.1111/are.12831</pub-id></citation>
</ref>
<ref id="B73">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yoshitake</surname> <given-names>K.</given-names></name> <name><surname>Igarashi</surname> <given-names>Y.</given-names></name> <name><surname>Mizukoshi</surname> <given-names>M.</given-names></name> <name><surname>Kinoshita</surname> <given-names>S.</given-names></name> <name><surname>Mitsuyama</surname> <given-names>S.</given-names></name> <name><surname>Suzuki</surname> <given-names>Y.</given-names></name> <etal/></person-group>. (<year>2018</year>). <article-title>Artificially designed hybrids facilitate efficient generation of high-resolution linkage maps</article-title>. <source>Sci. Rep</source>. <volume>8</volume>:<fpage>16104</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-018-34431-6</pub-id><pub-id pub-id-type="pmid">30382134</pub-id></citation></ref>
<ref id="B74">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yu</surname> <given-names>Y.</given-names></name> <name><surname>Ouyang</surname> <given-names>Y.</given-names></name> <name><surname>Yao</surname> <given-names>W.</given-names></name></person-group> (<year>2018</year>). <article-title>shinyCircos: an R/Shiny application for interactive creation of Circos plot</article-title>. <source>Bioinformatics (Oxford, England)</source> <volume>34</volume>, <fpage>1229</fpage>&#x02013;<lpage>1231</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btx763</pub-id><pub-id pub-id-type="pmid">29186362</pub-id></citation></ref>
<ref id="B75">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yuan</surname> <given-names>Z.</given-names></name> <name><surname>Liu</surname> <given-names>S.</given-names></name> <name><surname>Zhou</surname> <given-names>T.</given-names></name> <name><surname>Tian</surname> <given-names>C.</given-names></name> <name><surname>Bao</surname> <given-names>L.</given-names></name> <name><surname>Dunham</surname> <given-names>R.</given-names></name> <etal/></person-group>. (<year>2018</year>). <article-title>Comparative genome analysis of 52 fish species suggests differential associations of repetitive elements with their living aquatic environments</article-title>. <source>BMC Genomics</source> <volume>19</volume>:<fpage>141</fpage>. <pub-id pub-id-type="doi">10.1186/s12864-018-4516-1</pub-id><pub-id pub-id-type="pmid">29439662</pub-id></citation></ref>
</ref-list> 
</back>
</article> 