<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Physiol.</journal-id>
<journal-title>Frontiers in Physiology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Physiol.</abbrev-journal-title>
<issn pub-type="epub">1664-042X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fphys.2018.01833</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Physiology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>A Phylogenomic Framework and Divergence History of Cephalochordata Amphioxus</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Zhang</surname> <given-names>Qi-Lin</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="author-notes" rid="fn002"><sup>&#x2020;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/517288/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Zhang</surname> <given-names>Guan-Ling</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn002"><sup>&#x2020;</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Yuan</surname> <given-names>Ming-Long</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="author-notes" rid="fn002"><sup>&#x2020;</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Dong</surname> <given-names>Zhi-Xiang</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Li</surname> <given-names>Hong-Wei</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Guo</surname> <given-names>Jun</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Wang</surname> <given-names>Feng</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Deng</surname> <given-names>Xian-Yu</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Chen</surname> <given-names>Jun-Yuan</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/599376/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Lin</surname> <given-names>Lian-Bing</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
</contrib></contrib-group>
<aff id="aff1"><sup>1</sup><institution>Faculty of Life Science and Technology, Kunming University of Science and Technology</institution>, <addr-line>Kunming</addr-line>, <country>China</country></aff>
<aff id="aff2"><sup>2</sup><institution>Evo-Devo Institute, School of Life Sciences, Nanjing University</institution>, <addr-line>Nanjing</addr-line>, <country>China</country></aff>
<aff id="aff3"><sup>3</sup><institution>State Key Laboratory of Grassland Agro-Ecosystems, College of Pastoral Agricultural Science and Technology, Lanzhou University</institution>, <addr-line>Lanzhou</addr-line>, <country>China</country></aff>
<aff id="aff4"><sup>4</sup><institution>State Key Laboratory of Palaeobiology and Stratigraphy (LPS), Nanjing Institute of Geology and Palaeontology, Chinese Academy of Sciences</institution>, <addr-line>Nanjing</addr-line>, <country>China</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Ruriko Yoshida, University of Kentucky, United States</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Neil Moore, University of Kentucky, United States; Grady Weyenberg, University of Hawaii at Hilo, United States; Joseph Rusinko, Hobart and William Smith Colleges, United States</p></fn>
<corresp id="c001">&#x002A;Correspondence: Jun-Yuan Chen, <email>chenjy@nju.edu.cn</email> Lian-Bing Lin, <email>linlb@kmust.edu.cn</email></corresp>
<fn fn-type="other" id="fn002"><p><sup>&#x2020;</sup>These authors have contributed equally to this work</p></fn>
<fn fn-type="other" id="fn003"><p>This article was submitted to Systems Biology, a section of the journal Frontiers in Physiology</p></fn></author-notes>
<pub-date pub-type="epub">
<day>18</day>
<month>12</month>
<year>2018</year>
</pub-date>
<pub-date pub-type="collection">
<year>2018</year>
</pub-date>
<volume>9</volume>
<elocation-id>1833</elocation-id>
<history>
<date date-type="received">
<day>08</day>
<month>09</month>
<year>2018</year>
</date>
<date date-type="accepted">
<day>06</day>
<month>12</month>
<year>2018</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2018 Zhang, Zhang, Yuan, Dong, Li, Guo, Wang, Deng, Chen and Lin.</copyright-statement>
<copyright-year>2018</copyright-year>
<copyright-holder>Zhang, Zhang, Yuan, Dong, Li, Guo, Wang, Deng, Chen and Lin</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<p>Amphioxus, or cephalochordates, are often used as the living invertebrate proxy of vertebrate ancestors and are widely used as evolutionary biology models of chordates. However, their phylogeny, divergence history, and speciation characteristics remain poorly understood, and phylogenomic studies to explore these problems lacking entirely from the literature. Here, we determined a new transcriptome of <italic>Branchiostoma japonicum</italic>. Combined with mass sequences of all other 18 species, a 19-way phylogeny was constructed via multiple methods (ML, BI, PhyloBayes, and ASTRAL), consistently supporting a phylogeny of [(<italic>B. belcheri</italic> + <italic>B. japonicum</italic>) + (<italic>B. lanceolatum</italic> + <italic>B. floridae</italic>) + <italic>Asymmetron lucayanum</italic>] in amphioxus. Congruent phylogenetic signals were found across mitochondrial genes, 12S RNA, and complete mitochondrial genomes according to previous reports, indicating that 12S RNA may have potential as a molecular marker for phylogenetic analysis in amphioxus. Molecular dating analysis indicated a radiation of the cephalochordates during the Cretaceous (&#x223C;104-61 million years ago), supporting an association between the diversification and speciation of cephalochordates with continental drift and associated changes in their respective habitats during this time. The identified functional enrichment analysis for species-specific domains indicated that their function mainly involves immune response, apoptosis, and lipid metabolism and utilization, signaling that pathogens and changes of energy requirements are an important driving force for amphioxus speciation. This study represents the first large-scale phylogenomic analysis of most major amphioxus genera based on phylogenomic data, providing a new perspective on both phylogeny and divergence speciation of cephalochordates.</p>
</abstract>
<kwd-group>
<kwd>Cephalochordata</kwd>
<kwd>amphioxus</kwd>
<kwd>phylogenomics</kwd>
<kwd>divergence history</kwd>
<kwd>speciation process</kwd>
<kwd>protein domains</kwd>
<kwd>evolutionary genomics</kwd>
</kwd-group>
<contract-sponsor id="cn001">National Natural Science Foundation of China<named-content content-type="fundref-id">10.13039/501100001809</named-content></contract-sponsor>
<contract-sponsor id="cn002">National Natural Science Foundation of China<named-content content-type="fundref-id">10.13039/501100001809</named-content></contract-sponsor>
<counts>
<fig-count count="4"/>
<table-count count="3"/>
<equation-count count="0"/>
<ref-count count="63"/>
<page-count count="13"/>
<word-count count="0"/>
</counts>
</article-meta>
</front>
<body>
<sec><title>Introduction</title>
<p>Amphioxus, also known as lancelets, belongs to Leptocardii: Amphioxiformes and is the only modern representative of the subphylum Cephalochordata (<xref ref-type="bibr" rid="B26">Koop and Holland, 2008</xref>). Amphioxus is a key topic for investigations of evolutionary biology as they provide indications about the evolutionary origins of vertebrates, and provide an intriguing comparison point to trace how vertebrates have evolved and adapted (<xref ref-type="bibr" rid="B51">Shimeld and Holland, 2005</xref>; <xref ref-type="bibr" rid="B43">Putnam et al., 2008</xref>). Despite the separate evolution of cephalochordate and vertebrates from a common ancestor more than 520 million years ago (Mya), their body structure and morphology maximally retained characteristics of these vertebrate ancestors (<italic>Haikouella lanceolata</italic>) (<xref ref-type="bibr" rid="B6">Chen et al., 1999</xref>). With the recent accumulation of genetic data on amphioxus, the molecular phylogeny, evolutionary developmental biology (evo&#x2013;devo), and genomics further suggest amphioxus as a valid model of vertebrate ancestry (<xref ref-type="bibr" rid="B51">Shimeld and Holland, 2005</xref>; <xref ref-type="bibr" rid="B43">Putnam et al., 2008</xref>). The amphioxus of today is the only living cephalochordates and is distributed in three genera: <italic>Branchiostoma</italic> (&#x223C;28 species) with the largest number, <italic>Epigonichthys</italic> (one species), and <italic>Asymmetron</italic> (one species). However, additional cryptic species might exist (<xref ref-type="bibr" rid="B62">Yue et al., 2014</xref>). <italic>Branchiostoma</italic> widely distributed in the mid-low latitudes of the Atlantic Ocean, the Mediterranean, and the Pacific Ocean, with the remaining two genera primarily distributed in the mid-low latitudes and tropics along the equatorial zone. The habitat of amphioxus can be found in shallow coastal seawater at a depth of 8&#x2013;16 m, and the animals hide most of their bodies in the fine sand of the seafloor, finding their food via filter-feeding of the seawater.</p>
<p>Despite the important role of amphioxus in evolutionary biology, publications investigating the molecular phylogeny within amphioxus are few, especially in recent years. In contrast, many studies focus on scientific questions involving evolutionary biology and molecular phylogeny between amphioxus and vertebrates, which leads to a bias in our knowledge of amphioxus evolution. Previous studies of the last decade focused on amphioxus taxonomy and species divergence based on mitochondrial genomics (mitochondrial DNA, mtDNA). For example, <xref ref-type="bibr" rid="B33">Luo et al. (2007)</xref> used the cytochrome c oxidase subunit 1 (<italic>cox1</italic>) and cytochrome b subunit (<italic>cob</italic>) gene fragments to construct phylogenetic trees among <italic>Branchiostoma belcheri, B. japonicum</italic>, and <italic>B. tsingtaoensis</italic>, and calculated average genetic distance among them. The results showed a clustered clade and intraspecific differences between <italic>B. japonicum</italic> and <italic>B. tsingtaoensis</italic>, supporting the classification of <italic>B. tsingtaoensis</italic> as <italic>B. japonicum</italic>. Zhong et al. (2009) sequenced the complete mtDNA of both <italic>B. japonicum</italic> and <italic>B. belcheri</italic> and combined the results with the reported 13 protein-coding genes (PCGs) of mtDNA from five other species of amphioxus to construct a maximum likelihood (ML) tree of protein and nucleic acid sequences, respectively. Both phylogenetic trees supported the results of <xref ref-type="bibr" rid="B33">Luo et al. (2007)</xref>; moreover, the results of these investigations indicated that amphioxus living in Beihai, Guangxi province and Maoming, Guangdong province belongs to the same species <italic>B. belcheri</italic> (Zhong et al., 2009). Furthermore, Zhong et al. (2009) further constructed a phylogenetic tree containing different geographical populations of amphioxus based on the 12S rRNA (ribosomal RNA) sequence of mtDNA. It is worth noting that the tree constructed by 13 PCGs supported the following topological structure: ((((<italic>B. belcheri</italic> + <italic>B. japonicum</italic>) + <italic>Branchiostoma lanceolatum</italic>) + <italic>Branchiostoma floridae</italic>) + <italic>Asymmetron</italic>), while the 12S rRNA-based tree did not support <italic>B. lanceolatum</italic> as a sister lineage of the (<italic>B. belcheri</italic> + <italic>B. japonicum</italic>) clade instead of <italic>B. floridae</italic>, namely [(<italic>B. belcheri</italic> + <italic>B. japonicum</italic>) + (<italic>B. lanceolatum</italic> + <italic>B. floridae</italic>) + <italic>Asymmetron</italic>]. This inconsistency may be caused by limited sequence site information and use of improper molecular markers (Zhong et al., 2009). <xref ref-type="bibr" rid="B25">Kon et al. (2007)</xref> found the new species of amphioxus <italic>Asymmetron inferum</italic>, near whale corpses on the seafloor at a depth of 229m (Nommisaki cape, southwest of Kyushu island, Japan) and used the complete mtDNA of eight amphioxus species (including three other species as outgroups) to reconstruct their Bayesian (BI), ML, and maximal parsimony (MP) trees. The topology was consistent with that constructed via 12S rRNA, rather than that based on 13 PCGs by Zhong et al. (2009). The phylogenetic relationship among these four <italic>Branchiostoma</italic> species thus remained unclear and this divergence caused by various mtDNA genes still requires clarification.</p>
<p>Molecular dating based on phylogenetic tree was widely investigated within amphioxus species. <xref ref-type="bibr" rid="B25">Kon et al. (2007)</xref> estimated the divergence time of eight amphioxus species using molecular dating methods, showing that <italic>Asymmetron</italic> and <italic>Branchiostoma</italic> genera split from their common ancestor (<italic>Asymmetron</italic> &#x2013; <italic>Branchiostoma</italic>) about 240 Mya, and <italic>B. belcheri</italic> &#x2013; <italic>B. floridae</italic> about 130 Mya. However, more recently, <xref ref-type="bibr" rid="B62">Yue et al. (2014)</xref> constructed a ML tree of 15 species based on 427 orthologs using transcriptomic and genomic data and including two amphioxus species (<italic>B. floridae</italic> and <italic>A. lucayanum</italic>). They suggested a divergence time of <italic>Asymmetron</italic> &#x2013; <italic>Branchiostoma</italic> of about 120 Mya. <xref ref-type="bibr" rid="B19">Huang et al. (2014)</xref> performed genome sequencing of <italic>B. belcheri</italic> (reporting the second amphioxus genome after that of <italic>B. floridae</italic>) and estimated the divergence times of 15 species based on 513 orthologs from the genomic sets; their data covered the two amphioxus species, <italic>B. floridae</italic> and <italic>B. belcheri</italic>, which predicted 130 Mya as the divergence time between them. So far, phylogenetic trees containing multiple amphioxus species have been investigated based on mtDNA; however, those recently constructed by large-scale transcriptomic and genomic data contained only two amphioxus species (no more than two species). Therefore, it is necessary to reconstruct a phylogenetic tree containing multiple amphioxus species and to calculate the divergence time frame at the omics level to further uncover the divergence history and to alleviate the contradictions among previous investigations.</p>
<p>Additionally, previous investigations performed a direct comparison of the domain diversity between amphioxus and other model vertebrates, identifying amphioxus-specific protein domains from <italic>B. belcheri</italic> and <italic>B. floridae</italic> (<xref ref-type="bibr" rid="B19">Huang et al., 2014</xref>). Nevertheless, lineage-specific domains among multiple amphioxus species and their biological function remain largely unknown, which obstructs our understanding of the characteristics of amphioxus speciation.</p>
<p>Here, we sequenced the transcriptome of adult <italic>B. japonicum</italic>, and assembled, respectively, it and <italic>A. Lucayanum</italic> transcriptome. Combined with the whole-genome gene set for the other 16 species and the transcriptome of <italic>B. lanceolatum</italic>, we performed large-scale comparative analyses to reconstruct the phylogenetic tree and estimate divergence times among cephalochordates. Moreover, species-specific and ancestral domains were identified among amphioxus and functional enrichment analyses were performed for each target domain set.</p>
</sec>
<sec id="s1" sec-type="materials|methods">
<title>Materials and Methods</title>
<sec><title>Ethics Statement</title>
<p>This study was carried out in accordance with the recommendations of the Guide for the Care and Use of Laboratory Invertebrate Animals. The protocol was approved by the Ethical Committee of Researches of the Nanjing University (NJU).</p>
</sec>
<sec><title>Materials and RNA Sequencing</title>
<p>Adult species of <italic>B. japonicum</italic> were collected from Qingdao, Shandong province, China, and kept in laboratory for 5 days to facilitate emptying of the digestive tract. Total RNA was isolated from several male and females using the TRIzol reagent (Invitrogen, United States), and genomic DNA was removed by RNase-Free DNase Set (Qiagen, Germany) according to the manufacturer&#x2019;s instructions. RNA quality was determined using Bioanalyser 2100 (Agilent, United States), and the concentration was measured using the NanoDrop 1000 (Thermo Scientific, United States). Standard cDNA libraries were constructed using standard Illumina libraries prep protocols and TruSeq kit (Illumina, United States). After homogenization treatment of sequencing libraries, RNA sequencing (RNA-seq) was conducted on an Illumina HiSeq<sup>TM</sup> 2000 with 100-bp paired-end reads. RNA-seq was performed in BGI (Shenzhen, China).</p>
</sec>
<sec><title>Assembly of Reads, Correction of Gene Models, and Functional Annotation</title>
<p>We firstly used FastQC (<xref ref-type="bibr" rid="B4">Brown et al., 2017</xref>) to control the quality of the raw sequencing reads by checking for over-represented and potentially contaminant sequences following stringent criteria: (1) reads with adaptors were discarded; (2) reads with unknown bases > 10% were discarded; (3) reads with a length &#x003C; 20 bp were discarded. We used the program Sickle to remove or trim low-quality reads [percentage of low-quality bases (bases with sequencing quality score &#x2264; 5) > 50%] (<xref ref-type="bibr" rid="B5">Cabili et al., 2011</xref>). Quality paired-end reads (clean reads) were obtained and then used to assemble the transcriptome using Trinity (<xref ref-type="bibr" rid="B13">Grabherr et al., 2011</xref>). In addition, we obtained clean reads of a further adult amphioxus (<italic>A. lucayanum</italic>) (Accession: SRX437621) from the Sequence Read Archive (SRA) database of the NCBI, and assembled its transcriptome following the above pipelines. Trinity can detect potential isoforms from alternative splicing and label them with the same prefix. For multiple isoforms, the longest unigene was selected from each isoform group as a unique representation for that group. We also downloaded the <italic>B. lanceolatum</italic> transcriptome from the NCBI Transcriptome Shotgun Assembly (TSA) database (Accession numbers: <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="JT846176">JT846176</ext-link>-<ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="JT905674">JT905674</ext-link>) (<xref ref-type="bibr" rid="B52">Silvan et al., 2012</xref>). Potential coding sequences (CDSs) of three amphioxus species were predicted via Blastx (default parameter) (<xref ref-type="bibr" rid="B39">Mount, 2007</xref>) search of the NCBI non-redundant (NR) protein database. The optimal alignment was extracted as template for the determination of the CDSs of unigenes. Then, ESTScan (<italic>E</italic>-value = 10<sup>-5</sup>) (<xref ref-type="bibr" rid="B20">Iseli et al., 1999</xref>) software was used to predict the CDS of unigenes that failed to produce any hit.</p>
<p>The protein, mRNA, and CDS sequences of 16 sampled species with sequenced genome were retrieved from online databases (see <bold>Supplementary Table <xref ref-type="supplementary-material" rid="SM4">S1</xref></bold> for details). Among these genomic sequences, the CDS and protein sequence of 15 species (except for <italic>A. mississippiensis</italic>) could not be completely matched, thus they were corrected. First, CDS sequences below 120 bp were removed; then, protein sequences were aligned to mRNA using Exonerate software (<xref ref-type="bibr" rid="B15">Guy and Birney, 2005</xref>). Based on amino acid-nucleic acid alignments, incompatible CDS and protein sequences were corrected, discarding uncorrected sequences. For the protein sequences translated from corrected CDSs, we used the Blastp tool to search for them in Nr, Swiss-Prot, and gene ontology (GO) databases (<bold>Table <xref ref-type="table" rid="T1">1</xref></bold>), respectively, performing functional annotation of all genes or unigenes.</p>
<table-wrap position="float" id="T1">
<label>Table 1</label>
<caption><p>Summary statistics for sequencing, assembly, and annotation of transcriptomes.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left"></td>
<th valign="top" align="center"><italic>B. japonicum</italic></th>
<th valign="top" align="center"><italic>A. lucayanum</italic></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Raw reads</td>
<td valign="top" align="center">&#x223C;52 million</td>
<td valign="top" align="center">&#x223C;146 million</td></tr>
<tr>
<td valign="top" align="left">Clean reads</td>
<td valign="top" align="center">&#x223C;49 million</td>
<td valign="top" align="center">&#x223C;135 million</td>
</tr>
<tr>
<td valign="top" align="left">Q20 percentage</td>
<td valign="top" align="center">97.09%</td>
<td valign="top" align="center">/</td>
</tr>
<tr>
<td valign="top" align="left">N50 (bp)</td>
<td valign="top" align="center">1,753</td>
<td valign="top" align="center">1,797</td>
</tr>
<tr>
<td valign="top" align="left">Number of final unigenes</td>
<td valign="top" align="center">92,003</td>
<td valign="top" align="center">112,753</td>
</tr>
<tr>
<td valign="top" align="left">Number of CDSs</td>
<td valign="top" align="center">50,316</td>
<td valign="top" align="center">42,148</td>
</tr>
<tr>
<td valign="top" align="left">NR</td>
<td valign="top" align="center">46,540</td>
<td valign="top" align="center">/</td>
</tr>
<tr>
<td valign="top" align="left">Swiss-Prot</td>
<td valign="top" align="center">31,941</td>
<td valign="top" align="center">/</td>
</tr>
<tr>
<td valign="top" align="left">GO</td>
<td valign="top" align="center">30,319</td>
<td valign="top" align="center">/</td></tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec><title>Construction of Orthologous Alignments</title>
<p>HaMSTR (<xref ref-type="bibr" rid="B9">Ebersberger et al., 2009</xref>) and reciprocal best hits (BRH) (<xref ref-type="bibr" rid="B38">Moreno-Hagelsieb and Latimer, 2008</xref>) methods are generally used for the construction of orthologous genes. The results obtained from HaMSTR and BRH methods were intersected as a final ortholog set of 19 sampled species, to avoid bias caused by using a single method only. For the HaMSTR approach, according to previous description in transcriptomic analyses (<xref ref-type="bibr" rid="B37">Misof et al., 2014</xref>; <xref ref-type="bibr" rid="B30">Li et al., 2015</xref>), a set of core-orthologs was constructed from nine vertebrate genomes including human (<italic>Homo sapiens</italic>), mouse (<italic>Mus musculus</italic>), chicken (<italic>Gallus gallus</italic>), zebrafish (<italic>Danio rerio</italic>), Coelacanth (<italic>Latimeria chalumnae</italic>), fugu (<italic>Takifugu rubripes</italic>), elephant shark (<italic>Callorhinchus milii</italic>), lamprey (<italic>Petromyzon marinus</italic>), and Western clawed frog (<italic>Xenopus tropicalis</italic>). All 6,793 one-to-one core-orthologous proteins were obtained from the OrthDB v9.1 database (<xref ref-type="bibr" rid="B27">Kriventseva et al., 2015</xref>) and were inputted into the multiple alignment tool Muscle (v3.8) (<xref ref-type="bibr" rid="B10">Edgar, 2004</xref>) using default sets. Then, a hidden Markov model &#x201C;primer taxa&#x201D; was built from the multiple alignment of the core-orthologs using the hmmbuild tool of the HMMER3 package (<xref ref-type="bibr" rid="B11">Finn et al., 2011</xref>). The &#x201C;primer taxa&#x201D; served as input to produce the core-ortholog database for the program HaMStR v.13.2.6 (<xref ref-type="bibr" rid="B9">Ebersberger et al., 2009</xref>) to search for the corresponding orthologs in the remaining 10 species. If one species contained multiple corresponding orthologs in co-orthologous, only the optimal hit was retained. HaMStR v.13.2.3 was run using strict parameters (-sequence file, -est, -hmmset, -refspec, -representative, and -ublast) according to a previous description (<xref ref-type="bibr" rid="B30">Li et al., 2015</xref>). Furthermore, Proteinortho (v5.13) (<italic>E</italic>-value = 10<sup>-10</sup>) (<xref ref-type="bibr" rid="B29">Lechner et al., 2011</xref>), software compiled based on the BRH method that is widely used for large-scale comparative genomic analysis, was employed to identify co-orthologous among all 19 species. The PhyloTreePruner pipeline was employed to pick the unique representative for each species in co-orthologous based on the gene tree (<xref ref-type="bibr" rid="B23">Kocot et al., 2013</xref>). According to the gene labels, the obtained orthologous gene groups were collectively included in the results from HaMSTR and BRH methods. All orthologous genes, including protein and CDS sequences, were aligned using the Prank tool (&#x201C;-codon&#x201D; option) (<xref ref-type="bibr" rid="B32">L&#x00F6;ytynoja and Goldman, 2005</xref>), and then further trimmed via Gblocks (<xref ref-type="bibr" rid="B56">Talavera and Castresana, 2007</xref>) with the parameter &#x201C;-t = c&#x201D; to remove poorly aligned regions. Trimmed alignments that contained shorter than 60 bp/20 amino acids were removed.</p>
</sec>
<sec><title>Phylogenetic Analysis</title>
<p>Concatenated alignments used for the construction of the phylogenetic tree were constructed from all orthologs using the FasParser package (<xref ref-type="bibr" rid="B54">Sun, 2017</xref>). The best amino acid substitution model was identified for the further phylogenetic analysis using ProtTest (v3.4) (<xref ref-type="bibr" rid="B1">Abascal et al., 2005</xref>). The LG+I+G+F model was recommended as the best model based on both the Akaike information criterion (AIC) and Bayesian information criterion (BIC). Phylogenetic analyses were conducted for all aligned protein dataset using site-homogeneous (ML and Bayes) and -heterogeneous models (PhyloBayes). RAxML 7.0.4 (<xref ref-type="bibr" rid="B14">Guindon et al., 2010</xref>) was used to constructed ML trees, and 1000 bootstraps (BS) were used to estimate node reliability. The Bayesian phylogenetic tree was reconstructed using MrBayes 3.2.2 (<xref ref-type="bibr" rid="B46">Ronquist et al., 2012</xref>). In MrBayes analysis, the LG model was not available; thus, the JTT+I+G+F model was used as the secondary best choice (<xref ref-type="bibr" rid="B62">Yue et al., 2014</xref>). Two independent runs with four chains (three heated and one cold) were conducted concurrently for 1,000,000 generations, sampling every 100 generations. When the estimated sample size (ESS) value exceeded 100 and the potential scale reduction factor (PSRF) was close to 1.0, stationarity was considered to be reached, as recommended by the MrBayes software (<xref ref-type="bibr" rid="B46">Ronquist et al., 2012</xref>). Next, the first 25% samples were discarded as burn-in, and the branch lengths and posterior probabilities (PP) were calculated in a consensus tree. Bayesian analyses with a site-heterogeneous model were implemented using PhyloBayes 4.1b (<xref ref-type="bibr" rid="B28">Lartillot et al., 2013</xref>). After the removal of constant sites from the alignment, two independent chains, starting from a random tree, were run under the CAT-GTR model.</p>
<p>Next, we also used ASTRAL II, a statistically consistent algorithm to estimate the species tree topology under the multi-species coalescent model (<xref ref-type="bibr" rid="B36">Mirarab et al., 2016</xref>). Support values were obtained by calculating the local posterior probability, a advantage of ASTRAL II that presented high precision compared to multi-locus bootstrapping on a wide set of simulated and biological datasets (<xref ref-type="bibr" rid="B49">Sayyari and Mirarab, 2016</xref>). We conducted the analysis without the &#x201C;species map&#x201D; set, which means that it is unnecessary to assign multiple individuals to the same species to one taxon. Species tree obtained from RAxML gene trees of each of the 3070 orthologous loci, summarized with ASTRAL II. As species tree analyses do not require outgroups (<xref ref-type="bibr" rid="B17">Heled and Drummond, 2009</xref>), all 19 species thus were included as ingroups in the ASTRAL II analyses.</p>
</sec>
<sec><title>Estimation of Divergence Time</title>
<p>Based on the ML tree reconstructed above, Bayesian estimation was performed for the divergence time of the sampled 19 species to construct a time frame of cephalochordate evolution. The nine divergence nodes were signed as calibration points according to previously summarized fossil records (<xref ref-type="bibr" rid="B3">Benton and Donoghue, 2007</xref>; <xref ref-type="bibr" rid="B62">Yue et al., 2014</xref>). A calibration point (520.00&#x2013;? Mya) from our early research was used at Olfactores (n) (<xref ref-type="bibr" rid="B6">Chen et al., 1999</xref>). In molecular dating analysis, a safe upper bound for the root age is essential in Markov chain Monte Carlo Tree (MCMCTree). Since no reliable fossil record exists that could be used here, the secondary calibration approach was used to obtain the root age (q, Deuterostomia). Currently, the divergence time at the Deuterostomia node was estimated based on the tree with the root node of Bilateria (Deuterostomia+Mollusca) via molecular clock. However, various values have been reported for the maximum constraints of the crown bilaterian divergence time, including 581.5 Mya (<xref ref-type="bibr" rid="B3">Benton and Donoghue, 2007</xref>), and 640&#x2013;730 Mya (<xref ref-type="bibr" rid="B41">Peterson et al., 2008</xref>). <xref ref-type="bibr" rid="B62">Yue et al. (2014)</xref> explored the divergence time of crown bilaterian via MCMCTree analysis, including well-described fossil calibrations, under fixed root lower bounds (531.50) and a variety of upper bounds (600, 700, 800, and 900 Mya). Then, the authors proposed that 600 and 700 Mya were reliable and calculated their respective divergence time of Deuterostomia based on both calibration constraints (resulting in 532.67&#x2013;598.27 and 585.50&#x2013;698.50 Mya) (<xref ref-type="bibr" rid="B62">Yue et al., 2014</xref>). Consequently, we employed both results as different secondary calibration dates for the Deuterostomia (q) node in the current investigations. All calibration constraints of divergence nodes are presented in <bold>Table <xref ref-type="table" rid="T2">2</xref></bold>.</p>
<table-wrap position="float" id="T2">
<label>Table 2</label>
<caption><p>Bayesian MCMC and R8S estimations for the divergence time of each internal node shown in <bold>Figure <xref ref-type="fig" rid="F2">2</xref></bold>, assuming that the Deuterostomia divergence (root calibration constraints) occurred at [532.67, 598.27] Mya.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="left"></td>
<th valign="top" align="left">Calibration constraints<hr/></th>
<th valign="top" align="center" colspan="2">MCMCTREE<hr/></th>
<th valign="top" align="center" colspan="2">R8S<hr/></th></tr>
<tr>
<th valign="top" align="left">Node index</th>
<th valign="top" align="left">Node name</th>
<th valign="top" align="center">[min, max] (Mya)</th>
<th valign="top" align="center">Mean (Mya)</th>
<th valign="top" align="center">95% CI (Mya)</th>
<th valign="top" align="center">Mean (Mya)</th>
<th valign="top" align="center">95% CI (Mya)</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">a</td>
<td valign="top" align="left">Eutheria</td>
<td valign="top" align="center">[61.50, 100.50]</td>
<td valign="top" align="center">76.49</td>
<td valign="top" align="center">[60.91&#x2013;99.43]</td>
<td valign="top" align="center">71.65</td>
<td valign="top" align="center">[56.72&#x2013;97.68]</td>
</tr>
<tr>
<td valign="top" align="left">b</td>
<td valign="top" align="left">Amniote</td>
<td valign="top" align="center">[312.30, 330.40]</td>
<td valign="top" align="center">318.63</td>
<td valign="top" align="center">[312.00&#x2013;329.34]</td>
<td valign="top" align="center">312.67</td>
<td valign="top" align="center">[301.47&#x2013;326.36]</td>
</tr>
<tr>
<td valign="top" align="left">c</td>
<td valign="top" align="left">Ankylopoda</td>
<td valign="top" align="center">[259.70, 299.80]</td>
<td valign="top" align="center">268.28</td>
<td valign="top" align="center">[258.33&#x2013;291.27]</td>
<td valign="top" align="center">257.36</td>
<td valign="top" align="center">[253.21&#x2013;284.63]</td>
</tr>
<tr>
<td valign="top" align="left">d</td>
<td valign="top" align="left">Archosauriformes</td>
<td valign="top" align="center">[235.00, 250.40]</td>
<td valign="top" align="center">244.31</td>
<td valign="top" align="center">[235.42&#x2013;250.63]</td>
<td valign="top" align="center">246.28</td>
<td valign="top" align="center">[237.34&#x2013;249.69]</td>
</tr>
<tr>
<td valign="top" align="left">e</td>
<td valign="top" align="left">Tetrapoda</td>
<td valign="top" align="center">[330.40, 350.10]</td>
<td valign="top" align="center">343.13</td>
<td valign="top" align="center">[331.80&#x2013;350.42]</td>
<td valign="top" align="center">344.07</td>
<td valign="top" align="center">[331.78&#x2013;351.51]</td>
</tr>
<tr>
<td valign="top" align="left">f</td>
<td valign="top" align="left">Sarcopterygii</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">382.15</td>
<td valign="top" align="center">[354.82&#x2013;407.11]</td>
<td valign="top" align="center">367.22</td>
<td valign="top" align="center">[333.78&#x2013;398.61]</td>
</tr>
<tr>
<td valign="top" align="left">g</td>
<td valign="top" align="left">Osteichthyes</td>
<td valign="top" align="center">[416.00, 421.75]</td>
<td valign="top" align="center">418.68</td>
<td valign="top" align="center">[416.02&#x2013;421.73]</td>
<td valign="top" align="center">424.82</td>
<td valign="top" align="center">[418.13&#x2013;431.44]</td>
</tr>
<tr>
<td valign="top" align="left">h</td>
<td valign="top" align="left">Acanthopterygii</td>
<td valign="top" align="center">[149.85, 165.20]</td>
<td valign="top" align="center">157.36</td>
<td valign="top" align="center">[149.81&#x2013;165.20]</td>
<td valign="top" align="center">152.92</td>
<td valign="top" align="center">[146.65&#x2013;166.62]</td>
</tr>
<tr>
<td valign="top" align="left">i</td>
<td valign="top" align="left">Gnathostomata</td>
<td valign="top" align="center">[412.75, 462.50]</td>
<td valign="top" align="center">443.11</td>
<td valign="top" align="center">[420.23&#x2013;461.68]</td>
<td valign="top" align="center">448.65</td>
<td valign="top" align="center">[413.27&#x2013;477.76]</td>
</tr>
<tr>
<td valign="top" align="left">j</td>
<td valign="top" align="left">Vertebreta</td>
<td valign="top" align="center">[460.60, &#x2013;]</td>
<td valign="top" align="center">494.47</td>
<td valign="top" align="center">[460.94&#x2013;532.75]</td>
<td valign="top" align="center">471.19</td>
<td valign="top" align="center">[452.53&#x2013;498.87]</td>
</tr>
<tr>
<td valign="top" align="left">k</td>
<td valign="top" align="left">Olfactores</td>
<td valign="top" align="center">[520.00, &#x2013;]</td>
<td valign="top" align="center">548.41</td>
<td valign="top" align="center">[513.66&#x2013;579.60]</td>
<td valign="top" align="center">525.77</td>
<td valign="top" align="center">[504.49&#x2013;546.35]</td>
</tr>
<tr>
<td valign="top" align="left">l</td>
<td valign="top" align="left">Chordata</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">577.52</td>
<td valign="top" align="center">[544.32&#x2013;597.51]</td>
<td valign="top" align="center">546.06</td>
<td valign="top" align="center">[502.15&#x2013;588.26]</td>
</tr>
<tr>
<td valign="top" align="left">m</td>
<td valign="top" align="left">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">61.11</td>
<td valign="top" align="center">[9.93&#x2013;128.65]</td>
<td valign="top" align="center">64.23</td>
<td valign="top" align="center">[12.58&#x2013;123.75]</td>
</tr>
<tr>
<td valign="top" align="left">n</td>
<td valign="top" align="left">Branchiostomidae</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">86.83</td>
<td valign="top" align="center">[39.98&#x2013;149.47]</td>
<td valign="top" align="center">91.11</td>
<td valign="top" align="center">[32.84&#x2013;162.85]</td>
</tr>
<tr>
<td valign="top" align="left">o</td>
<td valign="top" align="left">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">72.42</td>
<td valign="top" align="center">[30.50&#x2013;140.35]</td>
<td valign="top" align="center">78.64</td>
<td valign="top" align="center">[34.22&#x2013;143.95]</td>
</tr>
<tr>
<td valign="top" align="left">p</td>
<td valign="top" align="left">Cephalochordata</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">104.37</td>
<td valign="top" align="center">[21.25&#x2013;191.35]</td>
<td valign="top" align="center">112.09</td>
<td valign="top" align="center">[28.80&#x2013;193.76]</td>
</tr>
<tr>
<td valign="top" align="left">q</td>
<td valign="top" align="left">Deuterostomia</td>
<td valign="top" align="center">[532.67, 598.27]</td>
<td valign="top" align="center">587.14</td>
<td valign="top" align="center">[557.15&#x2013;601.25]</td>
<td valign="top" align="center">569.53</td>
<td valign="top" align="center">[543.25&#x2013;589.17]</td>
</tr>
<tr>
<td valign="top" align="left">r</td>
<td valign="top" align="left">Ambulacraria</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">569.65</td>
<td valign="top" align="center">[461.45&#x2013;629.35]</td>
<td valign="top" align="center">547.27</td>
<td valign="top" align="center">[414.91&#x2013;601.75]</td></tr>
</tbody>
</table>
</table-wrap>
<p>Molecular dating analysis was conducted using the MCMCTree subprogram of the PAML package (v4.8) with the concatenated gene matrix used in the phylogenetic analysis (<xref ref-type="bibr" rid="B8">Dos and Yang, 2011</xref>). As fixed topology from the guide tree, we first obtained the ML estimates of the branch lengths, the gradient (G) vector, and the Hessian (H) matrix using the codeml from the PAML package (v4.8) (<xref ref-type="bibr" rid="B8">Dos and Yang, 2011</xref>), then, these estimated values were fed into control files of MCMCTree together with the LG substitution model. We set a time unit of 1 million years, and used the same gamma prior G(1, 100) to specify the substitution rate and rate drift parameters. An autocorrelated and lognormal relaxed clock model (<xref ref-type="bibr" rid="B44">Rannala and Yang, 2007</xref>) was used to estimate the posterior distribution of the divergence time, given these priors. The burn-in for the MCMC chain was run 10,000,000 generations, with sampling parameters every 1,000 generations. Two independent runs were conducted to ensure convergence of MCMC chains. The program summarized the mean and the 95% confidence intervals (CIs).</p>
<p>The penalized-likelihood (PL) approach was used in the program r8s V1.8 (<xref ref-type="bibr" rid="B48">Sanderson, 2003</xref>), in combination with the truncated-Newton algorithm (<xref ref-type="bibr" rid="B47">Sanderson, 2002</xref>). The cross-validation method in r8s was used to determine the optimal level of rate-smoothing of the PL analyses with smoothing parameters varying from 1 to 1,000 according to a previously described procedure (<xref ref-type="bibr" rid="B40">Mulcahy et al., 2012</xref>). The optimal smoothing parameter (<italic>S</italic> = 100) was first determined using the same fixed topology (ML) used as input for MCMCTree, since there is evidence that branch lengths are more accurately estimated by ML than by BI methods (<xref ref-type="bibr" rid="B50">Schwartz and Mueller, 2010</xref>). CIs for the PL age estimates were obtained by replicating PL analyses of 1,000 trees. The mean divergence time and 95% CIs were summarized using the r8s bootstrap kit.</p>
</sec>
<sec><title>Analysis of Molecular Evolution</title>
<p>To identify the domains contained in the protein sequences for all amphioxus, the amino acid sequence sets of five species of amphioxus were searched in Pfam-A database 31.0 using local HMMER 3.1<sup><xref ref-type="fn" rid="fn01">1</xref></sup>. This is the best program for domain identification and it has often been used together with a profile database, such as Pfam (<xref ref-type="bibr" rid="B45">Rekapalli et al., 2009</xref>). The domain ID set of each amphioxus was fed into a Venn Diagram<sup><xref ref-type="fn" rid="fn02">2</xref></sup> to obtain specific and shared domain types among the five investigated species of amphioxus. It is worth pointing out that only <italic>B. belcheri</italic> and <italic>B. floridae</italic> protein sets were generated from the sequenced whole genome, while those of the other three species were obtained from <italic>de novo</italic> assembled adult transcriptomes that contained assembly defects and missing protein sequences. However, a domain type could be contained in a variety of protein sequences and the domain size was short (generally in the range of 40&#x2013;50 amino acids), which effectively avoided bias caused by incomplete species protein sets and <italic>de novo</italic> assembly errors. Domain sequences were annotated to GO databases using the Blastp tool with default <italic>E</italic>-value. GO enrichment analysis for specific and shared domains among all amphioxus was performed via Fisher&#x2019;s exact test, that was implemented in the Blast2GO pipeline (<xref ref-type="bibr" rid="B7">Conesa et al., 2005</xref>). The Benjamini-Hochberg (BH) method was used for false discovery rate (FDR) correction for the Fisher test (FDR threshold values = 0.05). The list of significant GO terms was further filtered using GO trimming (v2.0) (<xref ref-type="bibr" rid="B22">Jantzen et al., 2011</xref>) to discard redundant terms. Pipeline of primary software used in this study was presented in <bold>Figure <xref ref-type="fig" rid="F1">1A</xref></bold>.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption><p><bold>(A)</bold> Pipeline of primary software used in this study. <bold>(B)</bold> 19-way maximum-likelihood (ML) tree inferred from the concatenated 397 orthologous gene groups. The branch length is proportional to the expected amino acid substitution rate and the scale bar represents 0.08 expected amino acid substitutions per site. Numbers on the internal nodes represent Bayesian posterior probabilities (PP1, left) of MrBayes, bootstrap values (BS, middle) of RAxML, and Bayesian posterior probabilities (PP2, right) of PhyloBayes. An asterisk indicates PP1 = 1.0, BS = 100, and PP2 = 1.0. The Bayesian and PhyloBayes trees are shown in <bold>Supplementary Figures <xref ref-type="supplementary-material" rid="SM1">S1</xref>, <xref ref-type="supplementary-material" rid="SM2">S2</xref></bold>, respectively.</p></caption>
<graphic xlink:href="fphys-09-01833-g001.tif"/>
</fig>
</sec>
</sec>
<sec><title>Results</title>
<sec><title>Sequencing, Assembly, and Annotation</title>
<p>Illumina sequencing for <italic>B. japonicum</italic> generated &#x223C;52 million raw reads. After quality control for the original data, &#x223C;49 million clean reads were obtained, and the Q20 percentage reached 97.09%, indicating a high quality of transcriptome sequencing (<bold>Table <xref ref-type="table" rid="T1">1</xref></bold>). Clean data have been submitted to the NCBI SRA database: Accession number <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="SRX448311">SRX448311</ext-link>. By Trinity initial assembly, we obtained 161,542 contigs with an N50 value of 816 bp and an average length of 375 bp. Further overlapping clustering for contig sequences, we finally obtained 92,003 unigenes with an N50 value of 1,753 bp and an average length of 785 bp. The assembly results of <italic>A. lucayanum</italic> were nearly consistent with previous reports that originally sequenced its transcriptomes (<xref ref-type="bibr" rid="B62">Yue et al., 2014</xref>). Furthermore, we aligned pair-end reads back to unigene sequences of <italic>B. japonicum</italic>, 86.15% clean reads could be completely matched, indicating that the assembly quality meets requirements for subsequent analysis. Based on unigene set obtained, 46,145 and 4,171 CDS sequences were obtained by homologous alignment search and ESTScan detection, respectively. 46,540, 31,941, 30,319 unigenes of <italic>B. japonicum</italic> were annotated into NR, Swiss-Prot, GO database (<bold>Table <xref ref-type="table" rid="T1">1</xref></bold>). For genomic sequences corrected, their CDS sequences are fully identical to their corresponding proteins, ensuring reliability of subsequent analysis. The summary statistics of gene correction are shown in <bold>Supplementary Table <xref ref-type="supplementary-material" rid="SM1">S1</xref></bold>.</p>
</sec>
<sec><title>Amphioxus Evolution Rate and Molecular Phylogeny</title>
<p>To further clarify the phylogenic relationships among amphioxus, we performed a phylogenetic analysis with five species of cephalochordates (<italic>B. belcheri, B. japonicum, B. lanceolatum, B. floridae</italic>, and <italic>A. lucayanum</italic>), 11 vertebrate species (human, mouse, American alligator, green lizard, chicken, western clawed frog, coelacanth, fugu, zebrafish, elephant shark, and lamprey), one urochordate (sea squirt), and two outgroups (acorn worm and sea urchin). A 19-way concatenated multiple protein alignment, based on 397 orthologous gene groups intersected by HaMSTR and BRH methods (442 for HaMSTR and 415 for BRH), was used to construct the phylogenetic tree. Furthermore, the branch length (the expected amino acid substitution rate) was calculated for each species based on ML (<bold>Figure <xref ref-type="fig" rid="F1">1B</xref></bold>), BI (<bold>Supplementary Figure <xref ref-type="supplementary-material" rid="SM1">S1</xref></bold>), and PhyloBayes (<bold>Supplementary Figure <xref ref-type="supplementary-material" rid="SM2">S2</xref></bold>). These three inference methods obtain congruent tree topologies with nearly identical branch lengths (<bold>Figure <xref ref-type="fig" rid="F1">1B</xref></bold>); nodal support values are generally high (PP = 0.95&#x2013;1.0, BS = 86&#x2013;100); moreover, these values are stronger in the BI tree than in the ML tree, as has been previously reported (<xref ref-type="bibr" rid="B59">Yuan et al., 2015</xref>; <xref ref-type="bibr" rid="B60">Yuan et al., 2016</xref>). The species tree estimated by ASTRAL-II is very similar to the tree estimated in the concatenated analysis, with most nodes showing 100% the local posterior probability (<bold>Figure <xref ref-type="fig" rid="F2">2</xref></bold>). Regardless of which analyzed method (ML, BI, or PhyloBayes) was used, the branch lengths of all amphioxus except for <italic>B. lanceolatum</italic> were consistently shorter than those of vertebrates, even shorter than that of the elephant shark (<italic>Callorhinchus milii</italic>) as the slowest evolving vertebrate (<xref ref-type="bibr" rid="B57">Venkatesh et al., 2014</xref>). The sea squirt showed the longest branch length in the phylogenetic tree. Interestingly, the branch length of <italic>B. lanceolatum</italic> is longer than those of other amphioxus and vertebrates investigated in this study. Based on this difference in branch length, the amino acid substitution rate of <italic>B. lanceolatum</italic> was assessed to be &#x223C;1.3 times higher than that of fugu (<italic>Takifugu rubripes</italic>) with the fastest evolutionary rate among vertebrates. We conducted Tajima&#x2019;s relative rate test (<xref ref-type="bibr" rid="B55">Tajima, 1993</xref>) based directly on the concatenated protein sequence alignment of pairwise tests between <italic>B. lanceolatum</italic> and fugu, which demonstrated a significant result (<italic>P-</italic>value below 0.05). In addition, the phylogenetic trees consistently support a phylogeny of [(<italic>B. belcheri</italic> + <italic>B. japonicum</italic>) + (<italic>B. lanceolatum</italic> + <italic>B. floridae</italic>) + <italic>A. lucayanum</italic>), regardless of the utilized analytical method.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption><p>Results of species tree analyses from 19-species-dataset. Branch support was estimated by computing the local posterior probability.</p></caption>
<graphic xlink:href="fphys-09-01833-g002.tif"/>
</fig>
</sec>
<sec><title>Estimates of Divergence Time Among Amphioxus Species</title>
<p>Based on the ML tree, we performed MCMCTree analysis for the divergence times among all 19 tested species (<bold>Figure <xref ref-type="fig" rid="F3">3</xref></bold>). Eleven time constraints were used across the phylogenetic tree (see section &#x201C;Materials and Methods&#x201D;). The Deuterostomia divergence times (root age) were employed as 532.67&#x2013;598.27 and 585.50&#x2013;698.50 Mya, respectively, based on previous investigations (<xref ref-type="bibr" rid="B62">Yue et al., 2014</xref>). The results for all age estimates with 95% CI (confidence interval) and mean values are shown in <bold>Tables <xref ref-type="table" rid="T2">2</xref>, <xref ref-type="table" rid="T3">3</xref></bold>. Regardless of which root age we used, the most recent common ancestor of the living amphioxus species (the divergence time between <italic>Asymmetron</italic> and <italic>Branchiostoma</italic>) was estimated to be &#x223C;104 Mya; the early splits within each main clade occurred at &#x223C;87 Mya; <italic>B. lanceolatum</italic> diverged from <italic>B. floridae</italic> at &#x223C;72 Mya, and the divergence time between <italic>B. belcheri</italic> and <italic>B. japonicum</italic> was &#x223C;61 Mya. In addition, to ensure the robustness of estimation results in the divergence time frame, R8S analysis was employed using the same set of time constraints (with a root age of 532.67&#x2013;598.27 Mya) that were used for the MCMCTree estimation. All divergence results with 95% CIs intervals and mean values are shown in <bold>Table <xref ref-type="table" rid="T2">2</xref></bold>. Despite the obviously different divergence times in several nodes, e.g., f, k, q, and r nodes, the r8s analyses overall supported the MCMCTree results, particularly within the cephalochordate. Consequently, the divergence times calculated with the MCMCTree were reliable and were directly used for the further discussion.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption><p>Estimates of the divergence time frame of cephalochordate evolution using MCMCTree. The lower-case letters above the lilac bar represent internal node labels (nodes a&#x2013;r). All corresponding time constraints, mean divergence times, and 95% confidence intervals (CI) obtained by the Bayesian estimations are tabulated in <bold>Table <xref ref-type="table" rid="T2">2</xref></bold>. Each lilac bar represents the 95% CI of the corresponding estimate.</p></caption>
<graphic xlink:href="fphys-09-01833-g003.tif"/>
</fig>
<table-wrap position="float" id="T3">
<label>Table 3</label>
<caption><p>Bayesian MCMC estimations for the divergence times of each internal node shown in <bold>Figure <xref ref-type="fig" rid="F2">2</xref></bold>, assuming that the Deuterostomia divergence (root calibration constraints) occurred at [585.50&#x2013;698.50] Mya.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="center"></td>
<th valign="top" align="center">Calibration</th>
</tr>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="center"></td>
<th valign="top" align="center">constraints<hr/></th>
<th valign="top" align="center" colspan="2">MCMCTREE<hr/></th></tr>
<tr>
<th valign="top" align="left">Node</th>
<th valign="top" align="center"></th>
<th valign="top" align="center"></th>
<th valign="top" align="center">Mean</th>
</tr>
<tr>
<th valign="top" align="left">index</th>
<th valign="top" align="center">Node name</th>
<th valign="top" align="center">[Min, Max] (Mya)</th>
<th valign="top" align="center">(Mya)</th>
<th valign="top" align="center">95% CI (Mya)</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">a</td>
<td valign="top" align="center">Eutheria</td>
<td valign="top" align="center">[61.50, 100.50]</td>
<td valign="top" align="center">73.34</td>
<td valign="top" align="center">[60.85&#x2013;98.57]</td>
</tr>
<tr>
<td valign="top" align="left">b</td>
<td valign="top" align="center">Amniote</td>
<td valign="top" align="center">[312.30, 330.40]</td>
<td valign="top" align="center">318.57</td>
<td valign="top" align="center">[311.92&#x2013;329.16]</td>
</tr>
<tr>
<td valign="top" align="left">c</td>
<td valign="top" align="center">Ankylopoda</td>
<td valign="top" align="center">[259.70, 299.80]</td>
<td valign="top" align="center">267.54</td>
<td valign="top" align="center">[257.93&#x2013;290.14]</td>
</tr>
<tr>
<td valign="top" align="left">d</td>
<td valign="top" align="center">Archosauriformes</td>
<td valign="top" align="center">[235.00, 250.40]</td>
<td valign="top" align="center">244.41</td>
<td valign="top" align="center">[235.51&#x2013;250.75]</td>
</tr>
<tr>
<td valign="top" align="left">e</td>
<td valign="top" align="center">Tetrapoda</td>
<td valign="top" align="center">[330.40, 350.10]</td>
<td valign="top" align="center">343.41</td>
<td valign="top" align="center">[332.18&#x2013;350.56]</td>
</tr>
<tr>
<td valign="top" align="left">f</td>
<td valign="top" align="center">Sarcopterygii</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">382.33</td>
<td valign="top" align="center">[356.45&#x2013;406.58]</td>
</tr>
<tr>
<td valign="top" align="left">g</td>
<td valign="top" align="center">Osteichthyes</td>
<td valign="top" align="center">[416.00, 421.75]</td>
<td valign="top" align="center">418.74</td>
<td valign="top" align="center">[416.16&#x2013;421.72]</td>
</tr>
<tr>
<td valign="top" align="left">h</td>
<td valign="top" align="center">Acanthopterygii</td>
<td valign="top" align="center">[149.85, 165.20]</td>
<td valign="top" align="center">157.37</td>
<td valign="top" align="center">[149.85&#x2013;165.11]</td>
</tr>
<tr>
<td valign="top" align="left">i</td>
<td valign="top" align="center">Gnathostomata</td>
<td valign="top" align="center">[412.75, 462.50]</td>
<td valign="top" align="center">447.07</td>
<td valign="top" align="center">[428.73&#x2013;462.66]</td>
</tr>
<tr>
<td valign="top" align="left">j</td>
<td valign="top" align="center">Vertebreta</td>
<td valign="top" align="center">[460.60, &#x2013;]</td>
<td valign="top" align="center">530.01</td>
<td valign="top" align="center">[477.45&#x2013;592.12]</td>
</tr>
<tr>
<td valign="top" align="left">k</td>
<td valign="top" align="center">Olfactores</td>
<td valign="top" align="center">[520.00, &#x2013;]</td>
<td valign="top" align="center">616.81</td>
<td valign="top" align="center">[554.53&#x2013;667.15]</td>
</tr>
<tr>
<td valign="top" align="left">l</td>
<td valign="top" align="center">Chordata</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">662.19</td>
<td valign="top" align="center">[603.55&#x2013;697.00]</td>
</tr>
<tr>
<td valign="top" align="left">m</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">60.93</td>
<td valign="top" align="center">[10.21&#x2013;136.41]</td>
</tr>
<tr>
<td valign="top" align="left">n</td>
<td valign="top" align="center">Branchiostomidae</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">84.92</td>
<td valign="top" align="center">[41.02&#x2013;162.19]</td>
</tr>
<tr>
<td valign="top" align="left">o</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">71.71</td>
<td valign="top" align="center">[31.93&#x2013;149.68]</td>
</tr>
<tr>
<td valign="top" align="left">p</td>
<td valign="top" align="center">Cephalochordata</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">100.11</td>
<td valign="top" align="center">[23.47&#x2013;211.63]</td>
</tr>
<tr>
<td valign="top" align="left">q</td>
<td valign="top" align="center">Deuterostomia</td>
<td valign="top" align="center">[585.50&#x2013;698.50]</td>
<td valign="top" align="center">677.64</td>
<td valign="top" align="center">[628.58&#x2013;709.37]</td>
</tr>
<tr>
<td valign="top" align="left">r</td>
<td valign="top" align="center">Ambulacraria</td>
<td valign="top" align="center">&#x2013;</td>
<td valign="top" align="center">601.93</td>
<td valign="top" align="center">[478.94&#x2013;712.88]</td></tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec><title>Identification and Functional Analysis of Shared and Species-Specific Protein Domains Among Amphioxus Species</title>
<p>Domains are independent functional evolutionary units that can be independently folded (<xref ref-type="bibr" rid="B58">Vogel et al., 2004</xref>); most of them have ancient original history (<xref ref-type="bibr" rid="B21">Itoh et al., 2007</xref>). To investigate the function of ancient and species-specific domains among amphioxus, we firstly retrieved 10,106, 10,708, 8,912, 8,313, and 9,821 domains from <italic>A. lucayanum, B. belcheri, B. floridae, B. lanceolatum</italic>, and <italic>B. japonicum</italic>, respectively, by searching for homologous domains in the Pfam-A database. Among these domains, 4,814 (group 1, G1) were shared between the genera <italic>Asymmetron</italic> and <italic>Branchiostoma</italic> (<bold>Supplementary Figure <xref ref-type="supplementary-material" rid="SM3">S3</xref></bold>) and were retained and handed down from their common ancestor.</p>
<p>Furthermore, gene ontology (GO) enrichment analysis for G1 found that 162 enriched GO terms belonging to the &#x201C;biological process&#x201D; subcategory are primarily related to development, cellular process and function, and metabolic processes (<bold>Supplementary Table <xref ref-type="supplementary-material" rid="SM5">S2</xref></bold>). Furthermore, we detected 492 (group 2, G2), 361 (group 3, G3), 427 (group 4, G4), 255 (group 5, G5), and 366 (group 6, G6) species-specific domains in <italic>B. belcheri, B. floridae, B. lanceolatum, B. japonicum</italic>, and <italic>A. lucayanum</italic>, respectively (<bold>Supplementary Tables <xref ref-type="supplementary-material" rid="SM6">S3</xref>&#x2013;<xref ref-type="supplementary-material" rid="SM10">S7</xref></bold>). To examine whether these species-specific domains had biological functionality, we also investigated the enrichment of GO terms for those in each of G2-6 (<bold>Supplementary Table <xref ref-type="supplementary-material" rid="SM11">S8</xref></bold>). Among 21 enriched GO terms in G2 (<italic>B. belcheri</italic>), those associated with the immune, inflammatory, stimulus response, apoptosis, and phagocytosis stood out in particular. For G3 (<italic>B. floridae</italic>), 42 GO terms were enriched, and those associated with development, immunity, and apoptosis were overrepresented. Next, 33 GO terms enriched from G4 (<italic>B. lanceolatum</italic>) were primarily involved in lipid storage and regulation, apoptosis, differentiation and movement of immune cells, and response to stimuli. In G5 (<italic>B. japonicum</italic>), 18 enriched GO terms were primarily related to lipoprotein oxidation and metabolism, antioxidant motions, apoptosis, and immune response. The 37 GO terms enriched in G6 (<italic>A. lucayanum</italic>) were involved in organics and energy metabolism, muscle development, and immunity system process. In general, GO terms involving innate immunity and apoptosis were most commonly enriched by these species-specific domains, follow by GO terms related to lipid metabolism and regulation as well as tissue development, suggesting a central role of these related domains in amphioxus speciation.</p>
</sec>
</sec>
<sec><title>Discussion</title>
<p>This study analyzed large-scale omics data of multiple amphioxus species (>2 species) to estimate their molecular phylogeny. Our phylogenomic analyses, based on the supergene dataset with four analytical methods, including three gene trees and one species tree, obtained a highly supported phylogeny of [(<italic>B. belcheri</italic> + <italic>B. japonicum</italic>) + (<italic>B. lanceolatum</italic> + <italic>B. floridae</italic>) + <italic>A. lucayanum</italic>]. This result was consistent with previous analyses that were based on the 12S rRNA (Zhong et al., 2009) and the whole sequences of mtDNA (<xref ref-type="bibr" rid="B25">Kon et al., 2007</xref>); however, they were incongruent to the results obtained with 13 PCGs, which indicated a phylogenetic relationship of ((((<italic>B. belcheri</italic> +<italic>B. japonicum</italic>) + <italic>B. lanceolatum</italic>) + <italic>B. floridae</italic>) + <italic>A. lucayanum</italic>). This discrepancy is likely caused by varying evolutionary and/or selection pressures, as has been reported for other animals (<xref ref-type="bibr" rid="B16">Havird and Santos, 2014</xref>; <xref ref-type="bibr" rid="B61">Yuan et al., 2018</xref>). Several studies indicated that the phylogenies obtained from transcriptomic, genomic, or complete mtDNA represent the highest phylogenetic performance and allow for better results than phylogenies from single gene and small-scale gene sets (<xref ref-type="bibr" rid="B42">Philippe et al., 2005</xref>; <xref ref-type="bibr" rid="B61">Yuan et al., 2018</xref>). Therefore, the obtained results indicated <italic>B. lanceolatum</italic> as a sister group of <italic>B. floridae</italic>, rather than (<italic>B. belcheri</italic> + <italic>B. japonicum</italic>). These analyses further indicated that 12S rRNA could generate a phylogeny similar to the massive nuclear genes and whole mitogenome, which may thus be used as a potential molecular marker in the phylogeny research of amphioxus. Certainly, this suggestion needs to be further investigated with more amphioxus species. In addition, <xref ref-type="bibr" rid="B62">Yue et al. (2014)</xref> reported a slower evolutionary rate of <italic>B. floridae</italic> and <italic>A. lucayanum</italic>, even compared to the slowest evolving vertebrate known (the elephant shark), and the authors speculated that <italic>Asymmetron</italic> and <italic>Branchiostoma</italic> genera should also be included. Indeed, the newly added amphioxus species <italic>B. belcheri</italic> and <italic>B. japonicum</italic> also showed an extremely slow evolutionary rate, supporting the speculation of <xref ref-type="bibr" rid="B62">Yue et al. (2014)</xref>. However, we found that <italic>B. lanceolatum</italic> is rapidly evolving, even beyond the level of the fastest evolving vertebrate. <italic>B. lanceolatum</italic> (named the Mediterranean amphioxus) is mainly found at the coast of the largest intercontinental sea (the Mediterranean Sea) and in a continental sea (the Black Sea). Due to these relatively closed environments, their terrestrial discharge and unique climate, both regions (particularly the Mediterranean) show exceptionally high biology diversity (<xref ref-type="bibr" rid="B35">Meynard et al., 2012</xref>). Therefore, a relatively closed habitat may be a key factor for driving the rapid evolution of <italic>B. lanceolatum</italic> propelled by its weaker ability to buffer against changing ecological factors. Seawater, warmed by a nuclear power plant since 1980 has been reported to cause rapid evolution of parasite resistance in the European perch of the nearly closed Baltic Sea (<xref ref-type="bibr" rid="B34">Mateosgonzalez et al., 2015</xref>). Additionally, one of the longer branches in the phylogenetic tree is the branch connecting the amphioxus to the other clades. Near to this branch are several of the other longest branches in the phylogeny. This pattern seems to be caused by long-branch attraction (LBA). Nevertheless, four methods used for gene and species tree establishment were employed for construction of phylogenetic tree. Particularly, ML analysis method presented relatively lower possibility to generate LBA (<xref ref-type="bibr" rid="B31">Li et al., 2007</xref>). Concerning the posterior consensus tree, due to Bayesian implementation of site-heterogeneous codon models, CAT-GTR in PhyloBayes seems to be significantly more robust against LBA, compared to all other models (<xref ref-type="bibr" rid="B28">Lartillot et al., 2013</xref>). Furthermore, phylogenetic position of the longer branches was mostly consistent with that reported previously (<xref ref-type="bibr" rid="B19">Huang et al., 2014</xref>; <xref ref-type="bibr" rid="B62">Yue et al., 2014</xref>). Our analysis thus has been avoided LBA as much as possible. Certainly, more comprehensive analysis was required to further reduce LBA possibility in future studies.</p>
<p>The estimation of divergence time is very helpful to understand the speciation event and evolutionary history of amphioxus. The obtained molecular dating results can be substantially influenced by a number of factors, e.g., evolutionary models, methods of analysis, and time constraints (<xref ref-type="bibr" rid="B2">Baele et al., 2012</xref>; <xref ref-type="bibr" rid="B61">Yuan et al., 2018</xref>). This study used multiple methods to estimate the divergence time of amphioxus to avoid the bias of using a single method of analysis only. Additionally, many fossil calibrations (reach 10) and a secondary constraint were used to improve the achieved accuracy of molecular dating. Our age estimation for the main vertebrate groups (slightly older) and the divergence of <italic>Branchiostoma</italic>&#x2013;<italic>Asymmetron</italic> (slightly younger) was mostly consistent with that reported by <xref ref-type="bibr" rid="B62">Yue et al. (2014)</xref>, indicating that our obtained results were robust. Five species of amphioxus showed speciation of no more than &#x223C;47 Mya (nodes p to m), indicating that even though most amphioxus species showed a slow evolutionary rate (<xref ref-type="bibr" rid="B43">Putnam et al., 2008</xref>; <xref ref-type="bibr" rid="B62">Yue et al., 2014</xref>), their speciation process is not as slow as could have been expected, and even exceeds that of most vertebrate groups. Despite the transcriptome of <italic>Epigonichthys</italic>, the third genus of cephalochordates, still being absent, analysis of the complete mtDNA showed a phylogeny relationship of &#x007B;vertebrates + [<italic>Asymmetron</italic> + (<italic>Branchiostoma</italic> + <italic>Epigonichthys</italic>)]&#x007D;, demonstrating that <italic>Asymmetron</italic> diverged earlier than the other two genera in cephalochordates (<xref ref-type="bibr" rid="B25">Kon et al., 2007</xref>). If mass sequences of <italic>Epigonichthys</italic> were added to our analyses, the first divergence time (&#x223C;104 Mya) of living cephalochordates will not become earlier than the current result. Before and at this time, the expansion of the mid-oceanic ridge was driving northward of the African plate according to the Wegener hypothesis of continental drift (<xref ref-type="bibr" rid="B53">Smith, 2014</xref>). The movement divided the common ancestors of <italic>Asymmetron</italic> and <italic>Branchiostoma</italic> into multiple isolated geographical populations. Part of these remained at their home areas along the equator and evolved into the <italic>Asymmetron</italic> ancestor, while others were pushed to a higher altitude and evolved into the <italic>Branchiostoma</italic> ancestor in the Tethys region between the Eurasian and African plates (<bold>Figure <xref ref-type="fig" rid="F4">4A</xref></bold>). The <italic>Asymmetron</italic> distribution primarily along the equator and low latitudes, showing high similarity with their current distribution pattern (<xref ref-type="bibr" rid="B24">Kon et al., 2006</xref>). This further supports the proposed divergence hypothesis between <italic>Asymmetron</italic> and <italic>Branchiostoma</italic>. Furthermore, it is reasonable to speculate that the common ancestor of living cephalochordates likely inhabited areas along the equator and low latitudes. With the northward movement of the African plate toward the Eurasian plate, the <italic>Branchiostoma</italic> ancestors divided into both eastern and western groups in this Tethys region (<bold>Figure <xref ref-type="fig" rid="F4">4B</xref></bold>). Notably, due to the reliable gene communication caused by the largely incomplete closure of the Tethys during this period, we suggest that speciation between both groups remained unfinished until &#x223C;87 Mya. At about 110&#x2013;65 Myr, the Atlantic Ocean gradually opened due to the gradual mid-Cretaceous separation of North America from the Eurasian plate and the breakup of Gondwana (namely Africa and South America). The spread of the Atlantic Ocean constitutes an oceanic barrier due to the enormous depth and width between Europe and the Americas (<xref ref-type="bibr" rid="B12">Frisch and Dawes, 2014</xref>; <xref ref-type="bibr" rid="B18">Hou and Li, 2017</xref>). Therefore, it is likely that western groups diverged into <italic>B. floridae</italic> at the west coast and <italic>B. lanceolatum</italic> at the east coast of the Atlantic Ocean at &#x223C;72 Mya due to the expansion of the Atlantic Ocean (<bold>Figure <xref ref-type="fig" rid="F4">4C</xref></bold>). Similar suggestions have been reported for mollusks and crustaceans (<xref ref-type="bibr" rid="B18">Hou and Li, 2017</xref>). India moved northward from its original position and collided with Asia during the Early Eocene (&#x223C;50 Mya) (<xref ref-type="bibr" rid="B18">Hou and Li, 2017</xref>). A wide eastern region of the Tethys thus remained to be opened &#x223C;61 Mya (<xref ref-type="bibr" rid="B18">Hou and Li, 2017</xref>), and was not divided into the Indian Ocean and the Pacific Ocean. We therefore speculate that the original eastern groups in the Tethys region between the Eurasian and African plates moved east through the region between the Eurasian and Indian plates. Subsequently, part of this moving population likely moved into higher latitudes along the eastern coastline of the Eurasian plate, and speciation of <italic>B. belcheri</italic> and <italic>B. japonicum</italic> happened at &#x223C;61 Mya during this period (<bold>Figure <xref ref-type="fig" rid="F4">4D</xref></bold>). It is likely that divergence of both species was driven by changes of the habitat caused by this difference in latitude. We thus propose that the oceanic evolution driven by platonic movement supplied an important factor for the divergence and speciation of cephalochordates. Consequently, the distribution pattern of living cephalochordates has a close evolutionary relationship with the tectonic structure.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption><p>Speciation hypotheses of cephalochordate during Cretaceous and early Cenozoic. <bold>(A)</bold> The African plate moved northward around 104 Mya; the purple oval indicates the common ancestor of existing cephalochordate; the dark green oval indicates the common ancestor of <italic>Branchiostoma</italic>; dark yellow ovals indicate <italic>Asymmetron</italic> ancestors; red dotted arrows indicate divergence and speciation. <bold>(B)</bold> The Africa plate moved northward around 86 Mya; dark blue ovals indicate western groups formed by divergence of the <italic>Branchiostoma</italic> ancestor in the Tethys region between the Eurasian and African plates; pink ovals indicate eastern groups. Continental movement that led to collisions caused the Tethys to shrink further. <bold>(C)</bold> The Atlantic Ocean is widened around 72 Mya; blue ovals indicate <italic>B. floridae</italic> lineage; yellow ovals indicate <italic>B. lanceolatum</italic>. <bold>(D)</bold> Divergence of <italic>B. belcheri</italic> and <italic>B. japonicum</italic> occurred at around 61 Mya; red ovals indicate <italic>B. belcheri</italic> lineage; pale green ovals indicate <italic>B. japonicum</italic>; Eastern groups moved eastward along with the southern margin of the Eurasian plates and speciated in this process.</p></caption>
<graphic xlink:href="fphys-09-01833-g004.tif"/>
</fig>
<p>Comparative domain analysis among different amphioxus species showed no significant difference of the number of domains identified by the whole genomes and transcriptomes. This indicates that domain types (not quantity) of the species were fully obtained through the transcriptome of adult amphioxus. Via GO enrichment analyses, we found that species-specific domains of amphioxus are consistently related to immune response and apoptosis. This result indicates exposure to pathogens in the seawater as a primarily driving force for the origin and evolution of amphioxus domains. This may be furthered by their burying in seafloor sand and relatively poor swimming ability, leading to an accumulation of pathogenic microorganisms. Previous studies reported that rapidly evolving genes between different genera or species of amphioxus were primarily involved in innate immunity (<xref ref-type="bibr" rid="B62">Yue et al., 2014</xref>; <xref ref-type="bibr" rid="B63">Zhang et al., 2018</xref>). This suggests that rapid evolution in sequence played a key role in the evolutionary origin of species-specific domains. Several species of amphioxus possess special capabilities for lipid utilization, particularly<sup><xref ref-type="fn" rid="fn03">3</xref></sup> <italic>B. lanceolatum</italic> (the website of the <italic>B. lanceolatum</italic> genome sequencing project). Our investigations found several GO terms involving lipid storage, metabolism, and regulation in <italic>B. lanceolatum</italic> and <italic>B. japonicum</italic>, perhaps indicating both species as ideal model species for research on the lipid biology of amphioxus. Moreover, this result also indicates species-specific adjustment of energy utilization and production as an important evolutionary step in the speciation history of amphioxus. The common primitive domains of cephalochordates primarily participated in development, cellular process and function, and metabolic process to ensure normal basic biological processes.</p>
<p>In summary, this study represents the first large-scale phylogenomic analysis including most major cephalochordate genera based on transcriptomic data. A phylogeny of [(<italic>B. belcheri</italic> + <italic>B. japonicum</italic>) + (<italic>B. lanceolatum</italic> + <italic>B. floridae</italic>) +<italic>A. lucayanum</italic>], clarifying the phylogenetic position of <italic>B. lanceolatum</italic>. Moreover, we proposed that 12S RNA reported previously mitochondrial genes may be a reliable molecular marker in phylogenetic analyses of cephalochordates. We firstly proposed that the currently living amphioxus species were not an old group, and most likely radiated during the Cretaceous, and their diversification and speciation was driven by primarily the platonic movements during this period. In addition, a batch of species-specific and ancestral protein domains was identified and functionally analyzed among cephalochordates using bioinformatics, indicating several factors that likely promoted the adaptation of amphioxus species to their respective habitats. Our study adds to the understanding of the cephalochordate evolutionary relationships and provides insight into their divergence history and speciation characteristics.</p>
</sec>
<sec><title>Author Contributions</title>
<p>L-BL, J-YC, and Q-LZ conceived and designed the experiments. Q-LZ, G-LZ, M-LY, Z-XD, and H-WL performed the experiments. Q-LZ, M-LY, JG, FW, and X-YD analyzed the data. Q-LZ, L-BL, and J-YC wrote the paper. L-BL, M-LY, and J-YC revised the manuscript.</p>
</sec>
<sec><title>Conflict of Interest Statement</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
</body>
<back>
<fn-group>
<fn fn-type="financial-disclosure">
<p><bold>Funding.</bold> This research was supported by the National Natural Science Foundation of China (31760042 and 41272008) and the program B for Outstanding Ph.D. candidate of Nanjing University (Grant No. 201702B075).</p>
</fn>
</fn-group>
<ack>
<p>We thank Prof. Shi-Cui Zhang from Ocean University of China for offering us <italic>B. japonicum</italic> amphioxus materials.</p>
</ack>
<sec sec-type="supplementary material">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fphys.2018.01833/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fphys.2018.01833/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Image_1.JPEG" id="SM1" mimetype="image/jpeg" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>FIGURE S1</label>
<caption><p>19-way Bayesian phylogenetic tree inferred from a concatenated orthologous gene matrix. Numbers on branches represent Bayesian posterior probabilities.</p></caption>
</supplementary-material>
<supplementary-material xlink:href="Image_2.JPEG" id="SM2" mimetype="image/jpeg" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>FIGURE S2</label>
<caption><p>19-way PhyloBayes phylogenetic tree inferred from a concatenated orthologous gene matrix.</p></caption>
</supplementary-material>
<supplementary-material xlink:href="Image_3.JPEG" id="SM3" mimetype="image/jpeg" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>FIGURE S3</label>
<caption><p>Domain venn diagram of five amphioxus species.</p></caption>
</supplementary-material>
<supplementary-material xlink:href="Table_1.XLSX" id="SM4" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>TABLE S1</label>
<caption><p>Summary statistics of sequence correction.</p></caption>
</supplementary-material>
<supplementary-material xlink:href="Table_2.xlsx" id="SM5" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>TABLE S2</label>
<caption><p>List of GO terms enriched by genes containing domains that are shared among all tested amphioxus.</p></caption>
</supplementary-material>
<supplementary-material xlink:href="Table_3.xlsx" id="SM6" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>TABLE S3</label>
<caption><p>Information of lineage-specific domains in <italic>Branchiostoma belcheri</italic>.</p></caption>
</supplementary-material>
<supplementary-material xlink:href="Table_4.xlsx" id="SM7" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>TABLE S4</label>
<caption><p>Information of lineage-specific domains in <italic>Branchiostoma floridae</italic>.</p></caption>
</supplementary-material>
<supplementary-material xlink:href="Table_5.xlsx" id="SM8" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>TABLE S5</label>
<caption><p>Information of lineage-specific domains in <italic>Branchiostoma lanceolatum</italic>.</p></caption>
</supplementary-material>
<supplementary-material xlink:href="Table_6.xlsx" id="SM9" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>TABLE S6</label>
<caption><p>Information of lineage-specific domains in <italic>Branchiostoma japonicum</italic>.</p></caption>
</supplementary-material>
<supplementary-material xlink:href="Table_7.xlsx" id="SM10" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>TABLE S7</label>
<caption><p>Information of lineage-specific domains in <italic>Asymmetron lucayanum</italic>.</p></caption>
</supplementary-material>
<supplementary-material xlink:href="Table_8.xlsx" id="SM11" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>TABLE S8</label>
<caption><p>List of GO terms enriched by genes containing lineage-specific domains in each species of amphioxus.</p></caption>
</supplementary-material>
</sec>
<ref-list>
<title>References</title>
<ref id="B1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Abascal</surname> <given-names>F.</given-names></name> <name><surname>Zardoya</surname> <given-names>R.</given-names></name> <name><surname>Posada</surname> <given-names>D.</given-names></name></person-group> (<year>2005</year>). <article-title>ProtTest: selection of best-fit models of protein evolution.</article-title> <source><italic>Bioinformatics</italic></source> <volume>21</volume> <fpage>2104</fpage>&#x2013;<lpage>2105</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/bti263</pub-id> <pub-id pub-id-type="pmid">15647292</pub-id></citation></ref>
<ref id="B2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Baele</surname> <given-names>G.</given-names></name> <name><surname>Lemey</surname> <given-names>P.</given-names></name> <name><surname>Bedford</surname> <given-names>T.</given-names></name> <name><surname>Rambaut</surname> <given-names>A.</given-names></name> <name><surname>Suchard</surname> <given-names>M. A.</given-names></name> <name><surname>Alekseyenko</surname> <given-names>A. V.</given-names></name></person-group> (<year>2012</year>). <article-title>Improving the accuracy of demographic and molecular clock model comparison while accommodating phylogenetic uncertainty.</article-title> <source><italic>Mol. Biol. Evol.</italic></source> <volume>29</volume> <fpage>2157</fpage>&#x2013;<lpage>2167</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/mss084</pub-id> <pub-id pub-id-type="pmid">22403239</pub-id></citation></ref>
<ref id="B3"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Benton</surname> <given-names>M. J.</given-names></name> <name><surname>Donoghue</surname> <given-names>P. C.</given-names></name></person-group> (<year>2007</year>). <article-title>Paleontological evidence to date the tree of life.</article-title> <source><italic>Mol. Biol. Evol.</italic></source> <volume>24</volume> <fpage>26</fpage>&#x2013;<lpage>53</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msl150</pub-id> <pub-id pub-id-type="pmid">17047029</pub-id></citation></ref>
<ref id="B4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Brown</surname> <given-names>J.</given-names></name> <name><surname>Pirrung</surname> <given-names>M.</given-names></name> <name><surname>Mccue</surname> <given-names>L. A.</given-names></name></person-group> (<year>2017</year>). <article-title>FQC dashboard: integrates FastQC results into a web-based, interactive, and extensible FASTQ quality control tool.</article-title> <source><italic>Bioinformatics</italic></source> <volume>33</volume> <fpage>3137</fpage>&#x2013;<lpage>3139</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btx373</pub-id> <pub-id pub-id-type="pmid">28605449</pub-id></citation></ref>
<ref id="B5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cabili</surname> <given-names>M. N.</given-names></name> <name><surname>Trapnell</surname> <given-names>C.</given-names></name> <name><surname>Goff</surname> <given-names>L.</given-names></name> <name><surname>Koziol</surname> <given-names>M.</given-names></name> <name><surname>Tazonvega</surname> <given-names>B.</given-names></name> <name><surname>Regev</surname> <given-names>A.</given-names></name><etal/></person-group> (<year>2011</year>). <article-title>Integrative annotation of human large intergenic noncoding RNAs reveals global properties and specific subclasses.</article-title> <source><italic>Gene. Dev.</italic></source> <volume>25</volume> <fpage>1915</fpage>&#x2013;<lpage>1927</lpage>. <pub-id pub-id-type="doi">10.1101/gad.17446611</pub-id> <pub-id pub-id-type="pmid">21890647</pub-id></citation></ref>
<ref id="B6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>J. Y.</given-names></name> <name><surname>Huang</surname> <given-names>D. Y.</given-names></name> <name><surname>Li</surname> <given-names>C. W.</given-names></name></person-group> (<year>1999</year>). <article-title>An early <italic>Cambrian craniate</italic>-like chordate.</article-title> <source><italic>Nature</italic></source> <volume>402</volume> <fpage>518</fpage>&#x2013;<lpage>522</lpage>. <pub-id pub-id-type="doi">10.1038/990080</pub-id></citation></ref>
<ref id="B7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Conesa</surname> <given-names>A.</given-names></name> <name><surname>G&#x00F6;tz</surname> <given-names>S.</given-names></name> <name><surname>Garc&#x00ED;ag&#x00F3;mez</surname> <given-names>J. M.</given-names></name> <name><surname>Terol</surname> <given-names>J.</given-names></name> <name><surname>Tal&#x00F3;n</surname> <given-names>M.</given-names></name> <name><surname>Robles</surname> <given-names>M.</given-names></name></person-group> (<year>2005</year>). <article-title>Blast2GO: a universal tool for annotation, visualization and analysis in functional genomics research.</article-title> <source><italic>Bioinformatics</italic></source> <volume>21</volume> <fpage>3674</fpage>&#x2013;<lpage>3676</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/bti610</pub-id> <pub-id pub-id-type="pmid">16081474</pub-id></citation></ref>
<ref id="B8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dos</surname> <given-names>R. M.</given-names></name> <name><surname>Yang</surname> <given-names>Z.</given-names></name></person-group> (<year>2011</year>). <article-title>Approximate likelihood calculation on a phylogeny for Bayesian estimation of divergence times.</article-title> <source><italic>Mol. Biol. Evol.</italic></source> <volume>28</volume> <fpage>2161</fpage>&#x2013;<lpage>2172</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msr045</pub-id> <pub-id pub-id-type="pmid">21310946</pub-id></citation></ref>
<ref id="B9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ebersberger</surname> <given-names>I.</given-names></name> <name><surname>Strauss</surname> <given-names>S.</given-names></name> <name><surname>von Haeseler</surname> <given-names>A.</given-names></name></person-group> (<year>2009</year>). <article-title>HaMStR: profile hidden markov model based search for orthologs in ESTs.</article-title> <source><italic>BMC Evol. Biol.</italic></source> <volume>9</volume>:<issue>157</issue>. <pub-id pub-id-type="doi">10.1186/1471-2148-9-157</pub-id> <pub-id pub-id-type="pmid">19586527</pub-id></citation></ref>
<ref id="B10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Edgar</surname> <given-names>R. C.</given-names></name></person-group> (<year>2004</year>). <article-title>MUSCLE: multiple sequence alignment with high accuracy and high throughput.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>32</volume> <fpage>1792</fpage>&#x2013;<lpage>1797</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkh340</pub-id> <pub-id pub-id-type="pmid">15034147</pub-id></citation></ref>
<ref id="B11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Finn</surname> <given-names>R. D.</given-names></name> <name><surname>Clements</surname> <given-names>J.</given-names></name> <name><surname>Eddy</surname> <given-names>S. R.</given-names></name></person-group> (<year>2011</year>). <article-title>HMMER web server: interactive sequence similarity searching.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>39</volume> <fpage>W29</fpage>&#x2013;<lpage>W37</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkr367</pub-id> <pub-id pub-id-type="pmid">21593126</pub-id></citation></ref>
<ref id="B12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Frisch</surname> <given-names>T.</given-names></name> <name><surname>Dawes</surname> <given-names>P. R.</given-names></name></person-group> (<year>2014</year>). <article-title>The rotations opening the Central and Northern Atlantic Ocean: compilation, drift lines, and flow lines.</article-title> <source><italic>Int. J. Earth Sci.</italic></source> <volume>103</volume> <fpage>967</fpage>&#x2013;<lpage>969</lpage>. <pub-id pub-id-type="doi">10.1007/s00531-013-0980-7</pub-id></citation></ref>
<ref id="B13"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Grabherr</surname> <given-names>M. G.</given-names></name> <name><surname>Haas</surname> <given-names>B. J.</given-names></name> <name><surname>Yassour</surname> <given-names>M.</given-names></name> <name><surname>Levin</surname> <given-names>J. Z.</given-names></name> <name><surname>Thompson</surname> <given-names>D. A.</given-names></name> <name><surname>Amit</surname> <given-names>I.</given-names></name><etal/></person-group> (<year>2011</year>). <article-title>Full-length transcriptome assembly from RNA-Seq data without a reference genome.</article-title> <source><italic>Nat. Biotechnol.</italic></source> <volume>29</volume> <fpage>644</fpage>&#x2013;<lpage>652</lpage>. <pub-id pub-id-type="doi">10.1038/nbt.1883</pub-id> <pub-id pub-id-type="pmid">21572440</pub-id></citation></ref>
<ref id="B14"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Guindon</surname> <given-names>S.</given-names></name> <name><surname>Dufayard</surname> <given-names>J.</given-names></name> <name><surname>Lefort</surname> <given-names>V.</given-names></name> <name><surname>Anisimova</surname> <given-names>M.</given-names></name> <name><surname>Hordijk</surname> <given-names>W.</given-names></name> <name><surname>Gascuel</surname> <given-names>O.</given-names></name></person-group> (<year>2010</year>). <article-title>New algorithms and methods to estimate maximum-likelihood phylogenies: assessing the performance of PhyML 3.0.</article-title> <source><italic>Syst. Biol.</italic></source> <volume>59</volume> <fpage>307</fpage>&#x2013;<lpage>321</lpage>. <pub-id pub-id-type="doi">10.1093/sysbio/syq010</pub-id> <pub-id pub-id-type="pmid">20525638</pub-id></citation></ref>
<ref id="B15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Guy</surname> <given-names>S. C. S.</given-names></name> <name><surname>Birney</surname> <given-names>E.</given-names></name></person-group> (<year>2005</year>). <article-title>Automated generation of heuristics for biological sequence comparison.</article-title> <source><italic>BMC Bioinformatics</italic></source> <volume>6</volume>:<issue>31</issue>. <pub-id pub-id-type="doi">10.1186/1471-2105-6-31</pub-id> <pub-id pub-id-type="pmid">15713233</pub-id></citation></ref>
<ref id="B16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Havird</surname> <given-names>J. C.</given-names></name> <name><surname>Santos</surname> <given-names>S. R.</given-names></name></person-group> (<year>2014</year>). <article-title>Performance of single and concatenated sets of mitochondrial genes at inferring metazoan relationships relative to full mitogenome data.</article-title> <source><italic>PLoS One</italic></source> <volume>9</volume>:<issue>e84080</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0084080</pub-id> <pub-id pub-id-type="pmid">24454717</pub-id></citation></ref>
<ref id="B17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Heled</surname> <given-names>J.</given-names></name> <name><surname>Drummond</surname> <given-names>A. J.</given-names></name></person-group> (<year>2009</year>). <article-title>Bayesian inference of species trees from multilocus data.</article-title> <source><italic>Mol. Biol. Evol.</italic></source> <volume>27</volume> <fpage>570</fpage>&#x2013;<lpage>580</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msp274</pub-id> <pub-id pub-id-type="pmid">19906793</pub-id></citation></ref>
<ref id="B18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hou</surname> <given-names>Z.</given-names></name> <name><surname>Li</surname> <given-names>S.</given-names></name></person-group> (<year>2017</year>). <article-title>Tethyan changes shaped aquatic diversification.</article-title> <source><italic>Biol. Rev.</italic></source> <volume>93</volume> <fpage>874</fpage>&#x2013;<lpage>896</lpage>. <pub-id pub-id-type="doi">10.1111/brv.12376</pub-id> <pub-id pub-id-type="pmid">29024366</pub-id></citation></ref>
<ref id="B19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Huang</surname> <given-names>S.</given-names></name> <name><surname>Chen</surname> <given-names>Z.</given-names></name> <name><surname>Yan</surname> <given-names>X.</given-names></name> <name><surname>Yu</surname> <given-names>T.</given-names></name> <name><surname>Huang</surname> <given-names>G.</given-names></name> <name><surname>Yan</surname> <given-names>Q.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>Decelerated genome evolution in modern vertebrates revealed by analysis of multiple lancelet genomes.</article-title> <source><italic>Nat. Commun.</italic></source> <volume>5</volume>:<issue>5896</issue>. <pub-id pub-id-type="doi">10.1038/ncomms6896</pub-id> <pub-id pub-id-type="pmid">25523484</pub-id></citation></ref>
<ref id="B20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Iseli</surname> <given-names>C.</given-names></name> <name><surname>Jongeneel</surname> <given-names>C. V.</given-names></name> <name><surname>Bucher</surname> <given-names>P.</given-names></name></person-group> (<year>1999</year>). <article-title>ESTScan: a program for detecting, evaluating, and reconstructing potential coding regions in EST sequences.</article-title> <source><italic>Proc. Int. Conf. Intell. Syst. Mol. Biol.</italic></source> <volume>1999</volume> <fpage>138</fpage>&#x2013;<lpage>148</lpage>. <pub-id pub-id-type="pmid">10786296</pub-id></citation></ref>
<ref id="B21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Itoh</surname> <given-names>M.</given-names></name> <name><surname>Nacher</surname> <given-names>J. C.</given-names></name> <name><surname>Kuma</surname> <given-names>K. I.</given-names></name> <name><surname>Goto</surname> <given-names>S.</given-names></name> <name><surname>Kanehisa</surname> <given-names>M.</given-names></name></person-group> (<year>2007</year>). <article-title>Evolutionary history and functional implications of protein domains and their combinations in eukaryotes.</article-title> <source><italic>Genome Biol.</italic></source> <volume>8</volume>:<issue>R121</issue>. <pub-id pub-id-type="doi">10.1186/gb-2007-8-6-r121</pub-id> <pub-id pub-id-type="pmid">17588271</pub-id></citation></ref>
<ref id="B22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jantzen</surname> <given-names>S. G.</given-names></name> <name><surname>Sutherland</surname> <given-names>B. J.</given-names></name> <name><surname>Minkley</surname> <given-names>D. R.</given-names></name> <name><surname>Koop</surname> <given-names>B. F.</given-names></name></person-group> (<year>2011</year>). <article-title>GO trimming: systematically reducing redundancy in large gene ontology datasets.</article-title> <source><italic>BMC Res. Notes</italic></source> <volume>4</volume>:<issue>267</issue>. <pub-id pub-id-type="doi">10.1186/1756-0500-4-267</pub-id> <pub-id pub-id-type="pmid">21798041</pub-id></citation></ref>
<ref id="B23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kocot</surname> <given-names>K. M.</given-names></name> <name><surname>Citarella</surname> <given-names>M. R.</given-names></name> <name><surname>Moroz</surname> <given-names>L. L.</given-names></name> <name><surname>Halanych</surname> <given-names>K. M.</given-names></name></person-group> (<year>2013</year>). <article-title>PhyloTreePruner: a phylogenetic tree-based approach for selection of orthologous sequences for phylogenomics.</article-title> <source><italic>Evol. Bioinformat. Online</italic></source> <volume>2013</volume> <fpage>429</fpage>&#x2013;<lpage>435</lpage>. <pub-id pub-id-type="doi">10.4137/EBO.S12813</pub-id> <pub-id pub-id-type="pmid">24250218</pub-id></citation></ref>
<ref id="B24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kon</surname> <given-names>T.</given-names></name> <name><surname>Nohara</surname> <given-names>M.</given-names></name> <name><surname>Nishida</surname> <given-names>M.</given-names></name> <name><surname>Sterrer</surname> <given-names>W.</given-names></name> <name><surname>Nishikawa</surname> <given-names>T.</given-names></name></person-group> (<year>2006</year>). <article-title>Hidden ancient diversification in the circumtropical lancelet <italic>Asymmetron lucayanum</italic> complex.</article-title> <source><italic>Mar. Biol.</italic></source> <volume>149</volume> <fpage>875</fpage>&#x2013;<lpage>883</lpage>. <pub-id pub-id-type="doi">10.1007/s00227-006-0271-y</pub-id></citation></ref>
<ref id="B25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kon</surname> <given-names>T.</given-names></name> <name><surname>Nohara</surname> <given-names>M.</given-names></name> <name><surname>Yamanoue</surname> <given-names>Y.</given-names></name> <name><surname>Fujiwara</surname> <given-names>Y.</given-names></name> <name><surname>Nishida</surname> <given-names>M.</given-names></name> <name><surname>Nishikawa</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2007</year>). <article-title>Phylogenetic position of a whale-fall lancelet (<italic>Cephalochordata</italic>) inferred from whole mitochondrial genome sequences.</article-title> <source><italic>BMC Evol. Biol.</italic></source> <volume>7</volume>:<issue>127</issue>. <pub-id pub-id-type="doi">10.1186/1471-2148-7-127</pub-id> <pub-id pub-id-type="pmid">17663797</pub-id></citation></ref>
<ref id="B26"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Koop</surname> <given-names>D.</given-names></name> <name><surname>Holland</surname> <given-names>L. Z.</given-names></name></person-group> (<year>2008</year>). <article-title>The basal chordate amphioxus as a simple model for elucidating developmental mechanisms in vertebrates.</article-title> <source><italic>Birth Defects Res. Part C Embryo Today Rev.</italic></source> <volume>84</volume> <fpage>175</fpage>&#x2013;<lpage>187</lpage>. <pub-id pub-id-type="doi">10.1002/bdrc.20128</pub-id> <pub-id pub-id-type="pmid">18773463</pub-id></citation></ref>
<ref id="B27"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kriventseva</surname> <given-names>E. V.</given-names></name> <name><surname>Tegenfeldt</surname> <given-names>F.</given-names></name> <name><surname>Petty</surname> <given-names>T. J.</given-names></name> <name><surname>Waterhouse</surname> <given-names>R. M.</given-names></name> <name><surname>Sim&#x00E3;o</surname> <given-names>F. A.</given-names></name> <name><surname>Pozdnyakov</surname> <given-names>I. A.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>OrthoDB v8: update of the hierarchical catalog of orthologs and the underlying free software.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>43</volume> <fpage>D250</fpage>&#x2013;<lpage>D256</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gku1220</pub-id> <pub-id pub-id-type="pmid">25428351</pub-id></citation></ref>
<ref id="B28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lartillot</surname> <given-names>N.</given-names></name> <name><surname>Rodrigue</surname> <given-names>N.</given-names></name> <name><surname>Stubbs</surname> <given-names>D.</given-names></name> <name><surname>Richer</surname> <given-names>J.</given-names></name></person-group> (<year>2013</year>). <article-title>PhyloBayes MPI: phylogenetic reconstruction with infinite mixtures of profiles in a parallel environment.</article-title> <source><italic>Syst. Biol.</italic></source> <volume>62</volume> <fpage>611</fpage>&#x2013;<lpage>615</lpage>. <pub-id pub-id-type="doi">10.1093/sysbio/syt022</pub-id> <pub-id pub-id-type="pmid">23564032</pub-id></citation></ref>
<ref id="B29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lechner</surname> <given-names>M.</given-names></name> <name><surname>Findei&#x00DF;</surname> <given-names>S.</given-names></name> <name><surname>Steiner</surname> <given-names>L.</given-names></name> <name><surname>Marz</surname> <given-names>M.</given-names></name> <name><surname>Stadler</surname> <given-names>P. F.</given-names></name> <name><surname>Prohaska</surname> <given-names>S. J.</given-names></name></person-group> (<year>2011</year>). <article-title>Proteinortho: detection of (Co-)orthologs in large-scale analysis.</article-title> <source><italic>BMC Bioinformatics</italic></source> <volume>12</volume>:<issue>124</issue>. <pub-id pub-id-type="doi">10.1186/1471-2105-12-124</pub-id> <pub-id pub-id-type="pmid">21526987</pub-id></citation></ref>
<ref id="B30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>F.</given-names></name> <name><surname>Xiao</surname> <given-names>Y.</given-names></name> <name><surname>Huang</surname> <given-names>F.</given-names></name> <name><surname>Deng</surname> <given-names>W.</given-names></name> <name><surname>Zhao</surname> <given-names>H.</given-names></name> <name><surname>Shi</surname> <given-names>X.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>Spatiotemporal-specific lncRNAs in the brain, colon, liver and lung of macaque during development.</article-title> <source><italic>Mol. Biosyst.</italic></source> <volume>11</volume> <fpage>3253</fpage>&#x2013;<lpage>3263</lpage>. <pub-id pub-id-type="doi">10.1039/c5mb00474h</pub-id> <pub-id pub-id-type="pmid">26456323</pub-id></citation></ref>
<ref id="B31"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>Y. W.</given-names></name> <name><surname>Yu</surname> <given-names>L.</given-names></name> <name><surname>Zhang</surname> <given-names>Y. P.</given-names></name></person-group> (<year>2007</year>). <article-title>&#x201C;Long-branch Attraction&#x201D; artifact in phylogenetic reconstruction.</article-title> <source><italic>Hereditas</italic></source> <volume>29</volume> <fpage>659</fpage>&#x2013;<lpage>667</lpage>. <pub-id pub-id-type="doi">10.1360/yc-007-0659</pub-id></citation></ref>
<ref id="B32"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>L&#x00F6;ytynoja</surname> <given-names>A.</given-names></name> <name><surname>Goldman</surname> <given-names>N.</given-names></name></person-group> (<year>2005</year>). <article-title>An algorithm for progressive multiple alignment of sequences with insertions.</article-title> <source><italic>Proc. Natl. Acad. Sci. U.S.A.</italic></source> <volume>102</volume> <fpage>10557</fpage>&#x2013;<lpage>10562</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.0409137102</pub-id> <pub-id pub-id-type="pmid">16000407</pub-id></citation></ref>
<ref id="B33"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Luo</surname> <given-names>J. C.</given-names></name> <name><surname>Xiao</surname> <given-names>Y. S.</given-names></name> <name><surname>Song</surname> <given-names>L.</given-names></name> <name><surname>Gao</surname> <given-names>T.</given-names></name> <name><surname>Zhang</surname> <given-names>Y.</given-names></name></person-group> (<year>2007</year>). <article-title>Phylogenetic separation of lancelets in China revealed by mitochondrial COI and Cyt b gene analysis.</article-title> <source><italic>S. China Fish. Sci.</italic></source> <volume>3</volume> <fpage>8</fpage>&#x2013;<lpage>14</lpage>.</citation></ref>
<ref id="B34"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mateosgonzalez</surname> <given-names>F.</given-names></name> <name><surname>Sundstr&#x00F6;m</surname> <given-names>L. F.</given-names></name> <name><surname>Schmid</surname> <given-names>M.</given-names></name> <name><surname>Bj&#x00F6;rklund</surname> <given-names>M.</given-names></name></person-group> (<year>2015</year>). <article-title>Rapid evolution of parasite resistance in a warmer environment: insights from a large scale field experiment.</article-title> <source><italic>PLoS One</italic></source> <volume>10</volume>:<issue>e0128860</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0128860</pub-id> <pub-id pub-id-type="pmid">26035300</pub-id></citation></ref>
<ref id="B35"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Meynard</surname> <given-names>C. N.</given-names></name> <name><surname>Mouillot</surname> <given-names>D.</given-names></name> <name><surname>Mouquet</surname> <given-names>N.</given-names></name> <name><surname>Douzery</surname> <given-names>E. J. P.</given-names></name></person-group> (<year>2012</year>). <article-title>A phylogenetic perspective on the evolution of mediterranean teleost fishes.</article-title> <source><italic>PLoS One</italic></source> <volume>7</volume>:<issue>e36443</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0036443</pub-id> <pub-id pub-id-type="pmid">22590545</pub-id></citation></ref>
<ref id="B36"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mirarab</surname> <given-names>S.</given-names></name> <name><surname>Bayzid</surname> <given-names>M. S.</given-names></name> <name><surname>Warnow</surname> <given-names>T.</given-names></name></person-group> (<year>2016</year>). <article-title>Evaluating summary methods for multilocus species tree estimation in the presence of incomplete lineage sorting.</article-title> <source><italic>Syst. Biol.</italic></source> <volume>65</volume> <fpage>366</fpage>&#x2013;<lpage>380</lpage>. <pub-id pub-id-type="doi">10.1093/sysbio/syu063</pub-id> <pub-id pub-id-type="pmid">25164915</pub-id></citation></ref>
<ref id="B37"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Misof</surname> <given-names>B.</given-names></name> <name><surname>Liu</surname> <given-names>S.</given-names></name> <name><surname>Meusemann</surname> <given-names>K.</given-names></name> <name><surname>Peters</surname> <given-names>R. S.</given-names></name> <name><surname>Donath</surname> <given-names>A.</given-names></name> <name><surname>Mayer</surname> <given-names>C.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>Phylogenomics resolves the timing and pattern of insect evolution.</article-title> <source><italic>Science</italic></source> <volume>346</volume> <fpage>763</fpage>&#x2013;<lpage>767</lpage>. <pub-id pub-id-type="doi">10.1126/science.1257570</pub-id> <pub-id pub-id-type="pmid">25378627</pub-id></citation></ref>
<ref id="B38"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Moreno-Hagelsieb</surname> <given-names>G.</given-names></name> <name><surname>Latimer</surname> <given-names>K.</given-names></name></person-group> (<year>2008</year>). <article-title>Choosing BLAST options for better detection of orthologs as reciprocal best hits.</article-title> <source><italic>Bioinformatics</italic></source> <volume>24</volume> <fpage>319</fpage>&#x2013;<lpage>324</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btm585</pub-id> <pub-id pub-id-type="pmid">18042555</pub-id></citation></ref>
<ref id="B39"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mount</surname> <given-names>D. W.</given-names></name></person-group> (<year>2007</year>). <article-title>Using the basic local alignment search tool (BLAST).</article-title> <source><italic>CSH Protoc.</italic></source> <volume>2007</volume>:<issue>pdb.top17</issue>. <pub-id pub-id-type="doi">10.1101/pdb.top17</pub-id> <pub-id pub-id-type="pmid">21357135</pub-id></citation></ref>
<ref id="B40"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mulcahy</surname> <given-names>D. G.</given-names></name> <name><surname>Noonan</surname> <given-names>B. P.</given-names></name> <name><surname>Moss</surname> <given-names>T.</given-names></name> <name><surname>Townsend</surname> <given-names>T. M.</given-names></name> <name><surname>Reeder</surname> <given-names>T. W.</given-names></name> <name><surname>Sites</surname> <given-names>J. W.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>Estimating divergence dates and evaluating dating methods using phylogenomic and mitochondrial data in squamate reptiles.</article-title> <source><italic>Mol. Phylogen. Evol.</italic></source> <volume>65</volume> <fpage>974</fpage>&#x2013;<lpage>991</lpage>. <pub-id pub-id-type="doi">10.1016/j.ympev.2012.08.018</pub-id> <pub-id pub-id-type="pmid">22982760</pub-id></citation></ref>
<ref id="B41"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Peterson</surname> <given-names>K. J.</given-names></name> <name><surname>Cotton</surname> <given-names>J. A.</given-names></name> <name><surname>Gehling</surname> <given-names>J. G.</given-names></name> <name><surname>Pisani</surname> <given-names>D.</given-names></name></person-group> (<year>2008</year>). <article-title>The Ediacaran emergence of bilaterians: congruence between the genetic and the geological fossil records.</article-title> <source><italic>Philos. Trans. R. Soc. Lond. B Biol. Sci.</italic></source> <volume>363</volume> <fpage>1435</fpage>&#x2013;<lpage>1443</lpage>. <pub-id pub-id-type="doi">10.1098/rstb.2007.2233</pub-id> <pub-id pub-id-type="pmid">18192191</pub-id></citation></ref>
<ref id="B42"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Philippe</surname> <given-names>H.</given-names></name> <name><surname>Delsuc</surname> <given-names>F.</given-names></name> <name><surname>Brinkmann</surname> <given-names>H.</given-names></name> <name><surname>Lartillot</surname> <given-names>N.</given-names></name></person-group> (<year>2005</year>). <article-title>Phylogenomics.</article-title> <source><italic>Annu. Rev. Ecol. Evol. Syst.</italic></source> <volume>36</volume> <fpage>541</fpage>&#x2013;<lpage>562</lpage>. <pub-id pub-id-type="doi">10.1146/annurev.ecolsys.35.112202.130205</pub-id></citation></ref>
<ref id="B43"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Putnam</surname> <given-names>N. H.</given-names></name> <name><surname>Butts</surname> <given-names>T.</given-names></name> <name><surname>Ferrier</surname> <given-names>D. E. K.</given-names></name> <name><surname>Furlong</surname> <given-names>R. F.</given-names></name> <name><surname>Hellsten</surname> <given-names>U.</given-names></name> <name><surname>Kawashima</surname> <given-names>T.</given-names></name><etal/></person-group> (<year>2008</year>). <article-title>The amphioxus genome and the evolution of the chordate karyotype.</article-title> <source><italic>Nature</italic></source> <volume>453</volume> <fpage>1064</fpage>&#x2013;<lpage>1071</lpage>. <pub-id pub-id-type="doi">10.1038/nature06967</pub-id> <pub-id pub-id-type="pmid">18563158</pub-id></citation></ref>
<ref id="B44"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rannala</surname> <given-names>B.</given-names></name> <name><surname>Yang</surname> <given-names>Z.</given-names></name></person-group> (<year>2007</year>). <article-title>Inferring speciation times under an episodic molecular clock.</article-title> <source><italic>Syst. Biol.</italic></source> <volume>56</volume> <fpage>453</fpage>&#x2013;<lpage>466</lpage>. <pub-id pub-id-type="doi">10.1080/10635150701420643</pub-id> <pub-id pub-id-type="pmid">17558967</pub-id></citation></ref>
<ref id="B45"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rekapalli</surname> <given-names>B.</given-names></name> <name><surname>Halloy</surname> <given-names>C.</given-names></name> <name><surname>Zhulin</surname> <given-names>I. B.</given-names></name></person-group> (<year>2009</year>). <article-title>&#x201C;HSP-HMMER:a tool for protein domain identification on a large scale,&#x201D; in</article-title> <source><italic>Proceedings of the ACM Symposium on Applied Computing</italic></source> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>ACM, Inc.</publisher-name>) <fpage>766</fpage>&#x2013;<lpage>770</lpage>.</citation></ref>
<ref id="B46"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ronquist</surname> <given-names>F.</given-names></name> <name><surname>Teslenko</surname> <given-names>M.</given-names></name> <name><surname>van der Mark</surname> <given-names>P.</given-names></name> <name><surname>Ayres</surname> <given-names>D. L.</given-names></name> <name><surname>Darling</surname> <given-names>A.</given-names></name> <name><surname>H&#x00F6;hna</surname> <given-names>S.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>MrBayes 3.2: efficient Bayesian phylogenetic inference and model choice across a large model space.</article-title> <source><italic>Syst. Biol.</italic></source> <volume>61</volume> <fpage>539</fpage>&#x2013;<lpage>542</lpage>. <pub-id pub-id-type="doi">10.1093/sysbio/sys029</pub-id> <pub-id pub-id-type="pmid">22357727</pub-id></citation></ref>
<ref id="B47"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sanderson</surname> <given-names>M. J.</given-names></name></person-group> (<year>2002</year>). <article-title>Estimating absolute rates of molecular evolution and divergence times: a penalized likelihood approach.</article-title> <source><italic>Mol. Biol. Evol.</italic></source> <volume>19</volume> <fpage>101</fpage>&#x2013;<lpage>109</lpage>. <pub-id pub-id-type="doi">10.1093/oxfordjournals.molbev.a003974</pub-id> <pub-id pub-id-type="pmid">11752195</pub-id></citation></ref>
<ref id="B48"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sanderson</surname> <given-names>M. J.</given-names></name></person-group> (<year>2003</year>). <article-title>r8s: inferring absolute rates of molecular evolution and divergence times in the absence of a molecular clock.</article-title> <source><italic>Bioinformatics</italic></source> <volume>19</volume> <fpage>301</fpage>&#x2013;<lpage>302</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/19.2.301</pub-id> <pub-id pub-id-type="pmid">12538260</pub-id></citation></ref>
<ref id="B49"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sayyari</surname> <given-names>E.</given-names></name> <name><surname>Mirarab</surname> <given-names>S.</given-names></name></person-group> (<year>2016</year>). <article-title>Fast coalescent-based computation of local branch support from quartet frequencies.</article-title> <source><italic>Mol. Biol. Evol.</italic></source> <volume>33</volume> <fpage>1654</fpage>&#x2013;<lpage>1668</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msw079</pub-id> <pub-id pub-id-type="pmid">27189547</pub-id></citation></ref>
<ref id="B50"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Schwartz</surname> <given-names>R. S.</given-names></name> <name><surname>Mueller</surname> <given-names>R. L.</given-names></name></person-group> (<year>2010</year>). <article-title>Branch length estimation and divergence dating: estimates of error in Bayesian and maximum likelihood frameworks.</article-title> <source><italic>BMC Evol. Biol.</italic></source> <volume>10</volume>:<issue>5</issue>. <pub-id pub-id-type="doi">10.1186/1471-2148-10-5</pub-id> <pub-id pub-id-type="pmid">20064267</pub-id></citation></ref>
<ref id="B51"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shimeld</surname> <given-names>S. M.</given-names></name> <name><surname>Holland</surname> <given-names>N. D.</given-names></name></person-group> (<year>2005</year>). <article-title>Amphioxus molecular biology: insights into vertebrate evolution and developmental mechanisms.</article-title> <source><italic>Rev. Canadienne De Zool.</italic></source> <volume>83</volume> <fpage>90</fpage>&#x2013;<lpage>100</lpage>. <pub-id pub-id-type="doi">10.1139/z04-155</pub-id></citation></ref>
<ref id="B52"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Silvan</surname> <given-names>O.</given-names></name> <name><surname>Stephanie</surname> <given-names>B.</given-names></name> <name><surname>Belgacem</surname> <given-names>M. R.</given-names></name> <name><surname>Yann</surname> <given-names>L. P.</given-names></name> <name><surname>Hector</surname> <given-names>E.</given-names></name></person-group> (<year>2012</year>). <article-title>Sequencing and analysis of the mediterranean amphioxus (<italic>Branchiostoma lanceolatum</italic>) transcriptome.</article-title> <source><italic>PLoS One</italic></source> <volume>7</volume>:<issue>e36554</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0036554</pub-id> <pub-id pub-id-type="pmid">22590565</pub-id></citation></ref>
<ref id="B53"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Smith</surname> <given-names>H. A.</given-names></name></person-group> (<year>2014</year>). <article-title>The geodetic evidence concerning Wegener&#x2019;s hypothesis.</article-title> <source><italic>Empire Surv. Rev.</italic></source> <volume>9</volume> <fpage>90</fpage>&#x2013;<lpage>100</lpage>. <pub-id pub-id-type="doi">10.1179/sre.1947.9.65.90</pub-id></citation></ref>
<ref id="B54"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sun</surname> <given-names>Y. B.</given-names></name></person-group> (<year>2017</year>). <article-title>FasParser: a package for manipulating sequence data.</article-title> <source><italic>Zool. Res.</italic></source> <volume>38</volume> <fpage>110</fpage>&#x2013;<lpage>112</lpage>. <pub-id pub-id-type="doi">10.24272/j.issn.2095-8137.2017.017</pub-id> <pub-id pub-id-type="pmid">28409507</pub-id></citation></ref>
<ref id="B55"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tajima</surname> <given-names>F.</given-names></name></person-group> (<year>1993</year>). <article-title>Simple methods for testing the molecular evolutionary clock hypothesis.</article-title> <source><italic>Genetics</italic></source> <volume>135</volume> <fpage>599</fpage>&#x2013;<lpage>607</lpage>. <pub-id pub-id-type="pmid">8244016</pub-id></citation></ref>
<ref id="B56"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Talavera</surname> <given-names>G.</given-names></name> <name><surname>Castresana</surname> <given-names>J.</given-names></name></person-group> (<year>2007</year>). <article-title>Improvement of phylogenies after removing divergent and ambiguously aligned blocks from protein sequence alignments.</article-title> <source><italic>Syst. Biol.</italic></source> <volume>56</volume> <fpage>564</fpage>&#x2013;<lpage>577</lpage>. <pub-id pub-id-type="doi">10.1080/10635150701472164</pub-id> <pub-id pub-id-type="pmid">17654362</pub-id></citation></ref>
<ref id="B57"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Venkatesh</surname> <given-names>B.</given-names></name> <name><surname>Lee</surname> <given-names>A. P.</given-names></name> <name><surname>Ravi</surname> <given-names>V.</given-names></name> <name><surname>Maurya</surname> <given-names>A. K.</given-names></name> <name><surname>Lian</surname> <given-names>M. M.</given-names></name> <name><surname>Swann</surname> <given-names>J. B.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>Elephant shark genome provides unique insights into gnathostome evolution.</article-title> <source><italic>Nature</italic></source> <volume>505</volume> <fpage>174</fpage>&#x2013;<lpage>179</lpage>. <pub-id pub-id-type="doi">10.1038/nature12826</pub-id> <pub-id pub-id-type="pmid">24402279</pub-id></citation></ref>
<ref id="B58"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Vogel</surname> <given-names>C.</given-names></name> <name><surname>Bashton</surname> <given-names>M.</given-names></name> <name><surname>Kerrison</surname> <given-names>N. D.</given-names></name> <name><surname>Chothia</surname> <given-names>C.</given-names></name> <name><surname>Teichmann</surname> <given-names>S. A.</given-names></name></person-group> (<year>2004</year>). <article-title>Structure, function and evolution of multidomain proteins.</article-title> <source><italic>Curr. Opin. Struct. Biol.</italic></source> <volume>14</volume> <fpage>208</fpage>&#x2013;<lpage>216</lpage>. <pub-id pub-id-type="doi">10.1016/j.sbi.2004.03.011</pub-id> <pub-id pub-id-type="pmid">15093836</pub-id></citation></ref>
<ref id="B59"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yuan</surname> <given-names>M. L.</given-names></name> <name><surname>Zhang</surname> <given-names>Q. L.</given-names></name> <name><surname>Guo</surname> <given-names>Z. L.</given-names></name> <name><surname>Wang</surname> <given-names>J.</given-names></name> <name><surname>Shen</surname> <given-names>Y. Y.</given-names></name></person-group> (<year>2015</year>). <article-title>The complete mitochondrial genome of <italic>Corizus tetraspilus</italic> (Hemiptera: Rhopalidae) and phylogenetic analysis of Pentatomomorpha.</article-title> <source><italic>PLoS One</italic></source> <volume>10</volume>:<issue>e0129003</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0129003</pub-id> <pub-id pub-id-type="pmid">26042898</pub-id></citation></ref>
<ref id="B60"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yuan</surname> <given-names>M. L.</given-names></name> <name><surname>Zhang</surname> <given-names>Q. L.</given-names></name> <name><surname>Zhang</surname> <given-names>L.</given-names></name> <name><surname>Guo</surname> <given-names>Z. L.</given-names></name> <name><surname>Liu</surname> <given-names>Y. J.</given-names></name> <name><surname>Shen</surname> <given-names>Y. Y.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>High-level phylogeny of the Coleoptera inferred with mitochondrial genome sequences.</article-title> <source><italic>Mol. Phylogen. Evol.</italic></source> <volume>104</volume> <fpage>99</fpage>&#x2013;<lpage>111</lpage>. <pub-id pub-id-type="doi">10.1016/j.ympev.2016.08.002</pub-id> <pub-id pub-id-type="pmid">27497607</pub-id></citation></ref>
<ref id="B61"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yuan</surname> <given-names>M. L.</given-names></name> <name><surname>Zhang</surname> <given-names>Q. L.</given-names></name> <name><surname>Zhang</surname> <given-names>L.</given-names></name> <name><surname>Jia</surname> <given-names>C. L.</given-names></name> <name><surname>Li</surname> <given-names>X. P.</given-names></name> <name><surname>Yang</surname> <given-names>X. Z.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>Mitochondrial phylogeny, divergence history and high-altitude adaptation of grassland caterpillars (Lepidoptera: Lymantriinae: Gynaephora) inhabiting the Tibetan Plateau.</article-title> <source><italic>Mol. Phylogen. Evol.</italic></source> <volume>122</volume> <fpage>116</fpage>&#x2013;<lpage>124</lpage>. <pub-id pub-id-type="doi">10.1016/j.ympev.2018.01.016</pub-id> <pub-id pub-id-type="pmid">29408286</pub-id></citation></ref>
<ref id="B62"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yue</surname> <given-names>J. X.</given-names></name> <name><surname>Yu</surname> <given-names>J. K.</given-names></name> <name><surname>Putnam</surname> <given-names>N. H.</given-names></name> <name><surname>Holland</surname> <given-names>L. Z.</given-names></name></person-group> (<year>2014</year>). <article-title>The transcriptome of an amphioxus, <italic>Asymmetron lucayanum</italic>, from the Bahamas: a window into chordate evolution.</article-title> <source><italic>Genome Biol. Evol.</italic></source> <volume>6</volume> <fpage>2681</fpage>&#x2013;<lpage>2696</lpage>. <pub-id pub-id-type="doi">10.1093/gbe/evu212</pub-id> <pub-id pub-id-type="pmid">25240057</pub-id></citation></ref>
<ref id="B63"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>Q. L.</given-names></name> <name><surname>Xu</surname> <given-names>B.</given-names></name> <name><surname>Wang</surname> <given-names>X. Q.</given-names></name> <name><surname>Yuan</surname> <given-names>M. L.</given-names></name> <name><surname>Chen</surname> <given-names>J. Y.</given-names></name></person-group> (<year>2018</year>). <article-title>Genome-wide comparison of the protein-coding repertoire reveals fast evolution of immune-related genes in cephalochordates and <italic>Osteichthyes superclass</italic>.</article-title> <source><italic>Oncotarget</italic></source> <volume>9</volume>:<issue>83</issue>. <pub-id pub-id-type="doi">10.18632/oncotarget.22749</pub-id> <pub-id pub-id-type="pmid">29416598</pub-id></citation></ref>
</ref-list>
<fn-group>
<fn id="fn01"><label>1</label><p><ext-link ext-link-type="uri" xlink:href="http://www.hmmer.org/">http://www.hmmer.org/</ext-link></p></fn>
<fn id="fn02"><label>2</label><p><ext-link ext-link-type="uri" xlink:href="https://cran.r-project.org/">https://cran.r-project.org/</ext-link></p></fn>
<fn id="fn03"><label>3</label><p><ext-link ext-link-type="uri" xlink:href="http://www.genoscope.cns.fr/spip/L-espece-d-amphioxus-un-modele.html">http://www.genoscope.cns.fr/spip/L-espece-d-amphioxus-un-modele.html</ext-link></p></fn>
</fn-group>
</back>
</article>