<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Archiving and Interchange DTD v2.3 20070202//EN" "archivearticle.dtd">
<article xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="methods-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Virol.</journal-id>
<journal-title>Frontiers in Virology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Virol.</abbrev-journal-title>
<issn pub-type="epub">2673-818X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fviro.2021.751196</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Virology</subject>
<subj-group>
<subject>Methods</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>A Non-phylogeny-dependent Reassortment Detection Method for Influenza A Viruses</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Gong</surname> <given-names>Xingfei</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="author-notes" rid="fn002"><sup>&#x02020;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1428029/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Hu</surname> <given-names>Mingda</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn002"><sup>&#x02020;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/482632/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Wang</surname> <given-names>Boqian</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Yang</surname> <given-names>Haoyi</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1426873/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Jin</surname> <given-names>Yuan</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/742760/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Liang</surname> <given-names>Long</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/481889/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Yue</surname> <given-names>Junjie</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x0002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/482465/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Chen</surname> <given-names>Wei</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="corresp" rid="c002"><sup>&#x0002A;</sup></xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Ren</surname> <given-names>Hongguang</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c003"><sup>&#x0002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/510948/overview"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Beijing Institute of Biotechnology, State Key Laboratory of Pathogen and Biosecurity</institution>, <addr-line>Beijing</addr-line>, <country>China</country></aff>
<aff id="aff2"><sup>2</sup><institution>College of Computer, National University of Defense Technology</institution>, <addr-line>Changsha</addr-line>, <country>China</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Diego Forni, Eugenio Medea (IRCCS), Italy</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Irina V. Kiseleva, Institute of Experimental Medicine (RAS), Russia; Richard Johnathan Orton, University of Glasgow, United Kingdom</p></fn>
<corresp id="c001">&#x0002A;Correspondence: Hongguang Ren <email>bioren&#x00040;163.com</email></corresp>
<corresp id="c002">Wei Chen <email>chenwei&#x00040;nudt.edu.cn</email></corresp>
<corresp id="c003">Junjie Yue <email>yue_junjie&#x00040;126.com</email></corresp>
<fn fn-type="other" id="fn001"><p>This article was submitted to Bioinformatic and Predictive Virology, a section of the journal Frontiers in Virology</p></fn>
<fn fn-type="equal" id="fn002"><p>&#x02020;These authors have contributed equally to this work</p></fn></author-notes>
<pub-date pub-type="epub">
<day>07</day>
<month>12</month>
<year>2021</year>
</pub-date>
<pub-date pub-type="collection">
<year>2021</year>
</pub-date>
<volume>1</volume>
<elocation-id>751196</elocation-id>
<history>
<date date-type="received">
<day>09</day>
<month>10</month>
<year>2021</year>
</date>
<date date-type="accepted">
<day>09</day>
<month>11</month>
<year>2021</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x000A9; 2021 Gong, Hu, Wang, Yang, Jin, Liang, Yue, Chen and Ren.</copyright-statement>
<copyright-year>2021</copyright-year>
<copyright-holder>Gong, Hu, Wang, Yang, Jin, Liang, Yue, Chen and Ren</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract><p>Influenza A virus is a segmented RNA virus whose genome consists of 8 single-stranded negative-sense RNA segments. This unique genetic structure allows viruses to exchange their segments through reassortment when they infect the same host cell. Studying the determination and nature of influenza A virus reassortment is critical to understanding the generation of pandemic strains and the spread of viruses across species. Reassortment detection is the first step in influenza A virus reassortment research. Several methods for automatic detection of reassortment have been proposed, which can be roughly divided into two categories: phylogenetic methods and distance methods. In this article, we proposed a reassortment detection method that does not require multiple sequence alignment and phylogenetic analysis. We extracted the codon features from the segment sequence and expressed the sequence as a feature vector, and then used the clustering method of self-organizing map to cluster the sequence for each segment. Based on the clustering results and the epidemiological information of the virus, the reassortment detection was implemented. We used this method to perform reassortment detection on the collected 7,075 strains from Asia and identified 516 reassortment events. We also conducted a statistical analysis of the identified reassortment events and found conclusions consistent with previous studies. Our method will provide new insights for automating reassortment detection tasks and understanding the reassortment patterns of influenza A viruses.</p></abstract>
<kwd-group>
<kwd>influenza A virus</kwd>
<kwd>reassortment</kwd>
<kwd>detection</kwd>
<kwd>method</kwd>
<kwd>evolution</kwd>
</kwd-group>
<counts>
<fig-count count="6"/>
<table-count count="1"/>
<equation-count count="3"/>
<ref-count count="29"/>
<page-count count="9"/>
<word-count count="5391"/>
</counts>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1">
<title>Introduction</title>
<p>Annual epidemics and occasional pandemics caused by the influenza A virus (IAV) are important threats to human health. IAV can cause acute respiratory infections and cause high morbidity and mortality (<xref ref-type="bibr" rid="B1">1</xref>). Influenza A virus is a segmented RNA virus whose genome consists of 8 single-stranded, negative-sense RNA segments. When multiple influenza A viruses infect the same host cell, due to the genome characteristics of segmented viruses, the genomes of multiple viruses may exchange their segments, resulting in progeny viruses with new genome combinations (<xref ref-type="bibr" rid="B2">2</xref>). This process is called reassortment. Reassortment plays an important but undefined role in the cross-species transmission of influenza A virus (<xref ref-type="bibr" rid="B3">3</xref>). Many influenza pandemics in history were related to reassortment, including the Asian H2N2 influenza in 1957, the Hong Kong H3N2 influenza in 1968, and the 2009 H1N1 global influenza pandemic. The H7N9 avian influenza virus that broke out in 2013 was also reassorted from different viruses according to the study (<xref ref-type="bibr" rid="B4">4</xref>&#x02013;<xref ref-type="bibr" rid="B6">6</xref>). Therefore, studying the determination and nature of influenza A virus reassortment is essential for understanding the generation of pandemic strains and the spread of viruses across species.</p>
<p>Reassortment detection is the first step in the study of influenza A virus reassortment. Due to the different evolutionary histories from different viral gene segments, reassortment can be detected by comparing the inconsistencies in the phylogenetic relationship between different segments of the reassortant virus genome (<xref ref-type="bibr" rid="B7">7</xref>&#x02013;<xref ref-type="bibr" rid="B10">10</xref>). However, this method is impractical for studying large-scale influenza A virus data sets. On the one hand, the cost of building a phylogenetic tree will increase exponentially with the growth of data. On the other hand, for viruses with complex reassortment history, this method is also difficult to infer the actual situation. Therefore, several methods for automatic detection of reassortment have been proposed. These methods can be roughly divided into two categories: phylogenetic methods and distance methods. In the phylogenetic method (<xref ref-type="bibr" rid="B11">11</xref>), proposed FluReF, which searched the full phylogenetic tree from bottom to top to select candidate reassortment groups and determined candidates that satisfied the preset threshold and resulted in inconsistencies between the segment trees. Nagarajan and Kingsford (<xref ref-type="bibr" rid="B12">12</xref>) proposed a reassortment finder GiRaF based on graph incompatibility. This algorithm was based on an earlier method (<xref ref-type="bibr" rid="B13">13</xref>), which used a fast search algorithm to mine phylogenetic inconsistencies by constructing an incompatibility graph. GiRaF then used the phylogenetic distance test to increase the false positive rate and combined the results of all fragments of the genome to generate a comprehensive reassortment catalog. In the distance method (<xref ref-type="bibr" rid="B14">14</xref>), estimated that the two strains did not have the possibility of reassortment based on the Hamming distance between different segments. De Silva et al. (<xref ref-type="bibr" rid="B15">15</xref>) reported an algorithm based on strain neighborhood. They found the closest set of strains from the reference set for each segment and compared the results between different segments to identify reassortment. In general, the phylogenetic method is more reliable than the distance method, but its cost is higher and depends on the accuracy of the constructed phylogenetic tree, which is not suitable for large-scale data sets.</p>
<p>In this article, we proposed a phylogeny-independent reassortment detection method. It does not need to perform multiple sequence alignment or construct a phylogenetic tree. We expressed the sequence as a feature vector and used the clustering method of self-organizing map to cluster the sequence of each segment. After uniformly naming the type of each segment of the virus, it becomes very simple to identify the reassortment. We used this method to detect the overall reassortment for viruses in Asia, and performed a statistical analysis of the identified reassortment events to dig out the reassortment determinations and patterns. Our results showed that the algorithm can identify reassortment events reported in previous studies and reveal the complex reassortment history in Asia. Therefore, our method can effectively perform reassortment analysis on large-scale data sets.</p>
</sec>
<sec sec-type="materials and methods" id="s2">
<title>Materials and Methods</title>
<sec>
<title>Data Processing</title>
<p>To study the reassortment pattern in Asia as comprehensively as possible, we assembled all the sequences from the Influenza Virus Resources at the National Centre for Biotechnology Information (NCBI) (<ext-link ext-link-type="uri" xlink:href="https://ftp.ncbi.nih.gov/genomes/INFLUENZA/">https://ftp.ncbi.nih.gov/genomes/INFLUENZA/</ext-link>). The sequences sampled in Asia were then extracted. The sequences we downloaded are coding sequences. For each segment, we only consider the longest coding sequence. We deleted sequences with illegal characters in the codon region or incomplete length. Sequences without clear epidemiological information were also deleted. We did not consider the laboratory sequences. The genome of a virus would be preserved only when eight segment sequences met the above standards. After that, we obtained 7,075 genomes of IAVs. The distribution of the number of viruses in each subtype was shown in <xref ref-type="fig" rid="F1">Figure 1A</xref>. There are a large number of IAVs with H1N1 and H3N2 subtypes, both exceeding 1,000 strains. In the distribution of the host (<xref ref-type="fig" rid="F1">Figure 1B</xref>), viruses that infected humans, waterfowl, domestic birds, and swine account for the vast majority.</p>
<fig id="F1" position="float">
<label>Figure 1</label>
<caption><p><bold>(A)</bold> The distribution of the number of viruses in each subtype. <bold>(B)</bold> The distribution of the number of viruses in each host.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fviro-01-751196-g0001.tif"/>
</fig>
</sec>
<sec>
<title>Feature Extraction</title>
<p>Based on the distance measure DMk proposed by Wei et al. (<xref ref-type="bibr" rid="B16">16</xref>), we introduced our feature extraction method for each segment sequence. A segment sequence is composed of 64 kinds of codons arranged in order. Since a codon may appear multiple times in the sequence, we can record the position of each occurrence. All the occurrence positions can form an array, recorded as {<sub><italic>p</italic><sub>0</sub>, <italic>p</italic>1</sub>, <italic>p</italic><sub>2</sub>, &#x022EF;&#x02009;, <italic>p</italic><sub><italic>n</italic></sub>}. In order to facilitate the calculation of the interval, the position at the 0th occurrence <italic>p</italic><sub>0</sub> &#x0003D; 0 is added to the position sequence. Then we used the reciprocal of the interval between each occurrence and the previous occurrence as its occurrence density, calculated as</p>
<disp-formula id="E1"><mml:math id="M1"><mml:mtable columnalign="left"><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mi>d</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>-</mml:mo><mml:msub><mml:mrow><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mo>-</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:msub></mml:mrow></mml:mfrac></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<p>Where <italic>p</italic><sub><italic>i</italic></sub> represents the position of the i th occurrence of the codon, and <italic>p</italic><sub><italic>i</italic>&#x02212;1</sub> represents the position of the i-1 th occurrence of the codon. <italic>d</italic><sub><italic>i</italic></sub> reflects the interval, or density, between the i th occurrence and the i-1 th occurrence of the codon. In order to describe the order of the density array, we accumulated the density array to obtain the partial sum array, calculated as:</p>
<disp-formula id="E2"><mml:math id="M2"><mml:mtable columnalign="left"><mml:mtr><mml:mtd><mml:msub><mml:mrow><mml:mi>s</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mstyle displaystyle="true"><mml:munderover accentunder="false" accent="false"><mml:mrow><mml:mo>&#x02211;</mml:mo></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:munderover></mml:mstyle><mml:msub><mml:mrow><mml:mi>d</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<p>The partial sum array is calculated directly based on the density array, for example, <italic>s</italic><sub>1</sub> &#x0003D; <italic>d</italic><sub>1</sub>, <italic>s</italic><sub>2</sub> &#x0003D; <italic>d</italic><sub>1</sub>&#x0002B;<italic>d</italic><sub>2</sub>, and so on. This array is only determined by the occurrence position of the codon, and the position of the codon can be reversed based on the array. Shannon entropy reflects the order relationship of the elements in the sequence. In order to calculate Shannon entropy, we constructed a discrete probability distribution <italic>Q</italic> &#x0003D; {<italic>q</italic><sub>1</sub>, <italic>q</italic><sub>2</sub>, &#x022EF;&#x02009;, <italic>q</italic><sub><italic>n</italic></sub>}, where each probability is calculated as <inline-formula><mml:math id="M3"><mml:msub><mml:mrow><mml:mi>q</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:msub><mml:mrow><mml:mi>s</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>/</mml:mo><mml:munderover accentunder="false" accent="false"><mml:mrow><mml:mo>&#x02211;</mml:mo></mml:mrow><mml:mrow><mml:mi>j</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>n</mml:mi></mml:mrow></mml:munderover><mml:msub><mml:mrow><mml:mi>s</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula>. Then the Shannon entropy can be calculated as:</p>
<disp-formula id="E3"><mml:math id="M4"><mml:mtable columnalign="left"><mml:mtr><mml:mtd><mml:mi>H</mml:mi><mml:mo>=</mml:mo><mml:mo>-</mml:mo><mml:mstyle displaystyle="true"><mml:munderover accentunder="false" accent="false"><mml:mrow><mml:mo>&#x02211;</mml:mo></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>n</mml:mi></mml:mrow></mml:munderover></mml:mstyle><mml:msub><mml:mrow><mml:mi>q</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mtext>&#x000A0;</mml:mtext><mml:mi>l</mml:mi><mml:mi>o</mml:mi><mml:msub><mml:mrow><mml:mi>g</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msub><mml:mtext>&#x000A0;</mml:mtext><mml:msub><mml:mrow><mml:mi>q</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mtd></mml:mtr></mml:mtable></mml:math></disp-formula>
<p>For each codon, we can calculate a Shannon entropy, and the Shannon entropy of all codons finally constitutes a feature vector. In the actual process, we removed the feature of 3 stop codons, and finally got a 61-dimensional vector for each segment sequence.</p>
</sec>
<sec>
<title>SOM-Based Clustering</title>
<p>In this section, we proposed a sequence clustering method based on the self-organizing map (SOM). SOM is an unsupervised artificial neural network. Different from the general neural network training based on the reverse transfer of the loss function, it uses a competitive learning strategy and relies on the competition between neurons to gradually optimize the network. The neighbor relationship function is used to maintain the topological structure of the input space. In our clustering method, the algorithm takes the 61-dimensional vectors extracted from the segment sequences as input and maps them to the nodes of the two-dimensional grid. Segment sequences with high similarity in the input space will be mapped to the same node. We used the minisom library to implement our algorithm. First, we calculated the number of nodes in the output layer according to the empirical formula of clustering <inline-formula><mml:math id="M5"><mml:mi>n</mml:mi><mml:mo>=</mml:mo><mml:mn>5</mml:mn><mml:msqrt><mml:mrow><mml:mi>N</mml:mi></mml:mrow></mml:msqrt></mml:math></inline-formula>, where N is the number of genomes. The size of the output layer is <inline-formula><mml:math id="M6"><mml:mi>s</mml:mi><mml:mi>i</mml:mi><mml:mi>z</mml:mi><mml:mi>e</mml:mi><mml:mo>=</mml:mo><mml:msqrt><mml:mrow><mml:mi>n</mml:mi></mml:mrow></mml:msqrt></mml:math></inline-formula>. The calculations above were rounded up. Then we initialize the SOM algorithm according to the following parameters: the output layer size was set to 61; the sigma parameter was set to 2; the learning rate was set to 1, and the neighborhood function was set to triangle; weight initialization method was set to PCA. The feature vector of each sequence was trained iteratively. After training, each vector was input to the SOM network and the winning node was the clustering type of the virus segment. Then we calculated the contour coefficient of the clustering result and recorded the corresponding parameters. Finally, we changed the parameters and repeated clustering. The clustering result with the highest contour coefficient was regarded as our final result for the segment clustering.</p>
</sec>
<sec>
<title>Reassortment Detection</title>
<p>Based on our clustering for each segment, we assigned a number x to each type and recorded it as segment_x. The virus sequences contained in each type were considered to have the same segmental ancestors. Therefore, if the eight segment types of a virus can be combined from segment types of other viruses, this virus may be produced by the reassortment of these viruses. There may be a situation where different combinations of multiple viruses can produce the eight segment types of the virus. For example, the eight segment types of virus A may be combined from segment types of virus B and virus C, or combined from segment types of virus D and virus E. Then we need to consider which combination is more likely to produce A by reassortment. To this end, we considered epidemiological information of the viruses such as host, location, and time. For viruses with multiple reassortment possibilities, we thought viruses with the similar host, location, and time are more likely to reassort. Our non-phylogeny-dependent reassortment detection method was shown in <xref ref-type="fig" rid="F2">Figure 2</xref>.</p>
<fig id="F2" position="float">
<label>Figure 2</label>
<caption><p>Reassortment detection framework. Each segment sequence was represented as a 61-dimensional feature vector and was input to SOM for clustering. The genotype was defined and reassortment detection was performed combined with the epidemiological information.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fviro-01-751196-g0002.tif"/>
</fig>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>Results</title>
<sec>
<title>Virus Similarity Network</title>
<p>Based on the feature vectors extracted from each sequence, we represented the IAV genome as a 488-dimensional feature vector composed of eight segment feature vectors. In this way, the similarity of the IAV genome can be characterized by the similarity of feature vectors. We then constructed a similarity matrix of all IAVs and used it to construct a similarity network. The minimum spanning tree algorithm was used to simplify our network, and the cys layout in cystoscope was used for display, which was shown in <xref ref-type="fig" rid="F2">Figure 2</xref>. In the virus similarity network, the subtypes of different virus genomes have been clearly distinguished (<xref ref-type="fig" rid="F3">Figure 3A</xref>), which proves that the feature vector we extracted is reasonable. It should be noted that swine is a mixed vessel, which connected the genome of the avian influenza virus and the genome of the human infected influenza virus (<xref ref-type="fig" rid="F3">Figure 3B</xref>). We also found that some human infected virus at the top of the figure. The genomes of these viruses were similar to those of domestic birds. Therefore, domestic birds also play an important role in the process of the avian influenza virus infecting humans.</p>
<fig id="F3" position="float">
<label>Figure 3</label>
<caption><p>Virus similarity network. <bold>(A)</bold> Different subtypes are represented by different colors. Viruses with the same subtype are clustered. <bold>(B)</bold> Different hosts are represented by different colors. Swine and domestic birds play an important role in human infection with avian influenza virus. The blue nodes in the middle represent swine hosts. Above these swine nodes are almost all avian host nodes (yellow-domesitic birds, purple-land birds, light blue-shorebirds, green-waterfowl), and below these swine hosts are almost all human host nodes (red). This implied that swine plays the role of an intermediate host between these avian host and human host. At the top of <bold>(B)</bold>, a small number of human host nodes can be found clustered. These nodes are close to the domestic birds node (yellow). Therefore, domestic birds also play an important role in the avian influenza viruses&#x00027; cross-species and infecting humans. Avian waterfowls were considered as the natural hosts of IAVs, domestic birds and swine may have played an important role as incubation for the IAVs&#x00027; transmission to humans.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fviro-01-751196-g0003.tif"/>
</fig>
</sec>
<sec>
<title>Segment Clustering Result</title>
<p>Using our feature extraction and SOM-based clustering method, we divided eight segments of influenza A virus into different types, respectively, which was shown in <xref ref-type="table" rid="T1">Table 1</xref>. According to the combination of hemagglutinin (HA) and neuraminidase (NA) proteins on the surface, the influenza A virus can be divided into different subtypes. At present, HA can be divided into 18 subtypes (H1-H18), NA can be divided into 11 subtypes (N1-N11). Therefore, segments with the same subtype should be grouped when we cluster HA and NA segments. Based on this, we checked the clustering results of HA and NA segments, which were shown in <xref ref-type="fig" rid="F4">Figure 4A</xref>. Each type contained only one subtype and the same subtypes were clustered together, indicating that our clustering method has no problem in distinguishing between subtypes. We also analyzed the number of types corresponding to different HA and NA subtypes, which was shown in <xref ref-type="fig" rid="F4">Figure 4B</xref>. For HA subtypes, the number of types in H1, H3, H5, and H9 is relatively large, indicating that the lineages of these subtypes are complex. For NA subtypes, there are relatively more types in N1 and N2. The clustering results for all segments can be found in <xref ref-type="supplementary-material" rid="SM1">Supplementary Tables 1</xref>&#x02013;<xref ref-type="supplementary-material" rid="SM8">8</xref>.</p>
<table-wrap position="float" id="T1">
<label>Table 1</label>
<caption><p>The number of types for each segment.</p></caption>
<table frame="hsides" rules="groups">
<thead><tr>
<th valign="top" align="left"><bold>Segment</bold></th>
<th valign="top" align="center"><bold>No. of types</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">PB2</td>
<td valign="top" align="center">415</td>
</tr>
<tr>
<td valign="top" align="left">PB1</td>
<td valign="top" align="center">421</td>
</tr>
<tr>
<td valign="top" align="left">PA</td>
<td valign="top" align="center">419</td>
</tr>
<tr>
<td valign="top" align="left">HA</td>
<td valign="top" align="center">387</td>
</tr>
<tr>
<td valign="top" align="left">NP</td>
<td valign="top" align="center">417</td>
</tr>
<tr>
<td valign="top" align="left">NA</td>
<td valign="top" align="center">376</td>
</tr>
<tr>
<td valign="top" align="left">MP</td>
<td valign="top" align="center">402</td>
</tr>
<tr>
<td valign="top" align="left">NS</td>
<td valign="top" align="center">410</td>
</tr>
</tbody>
</table>
</table-wrap>
<fig id="F4" position="float">
<label>Figure 4</label>
<caption><p>The clustering result for HA and NA segments. <bold>(A)</bold> The circles represent the clustering types. The number in the circle represents the number of segments contained in the type. Different subtypes are represented by different colors. If a type contains multiple subtypes, the circle will be divided into different parts with different colors. <bold>(B)</bold> The number of types corresponding to different HA and NA subtypes.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fviro-01-751196-g0004.tif"/>
</fig>
</sec>
<sec>
<title>Statistic of Reassortment Subtype</title>
<p>We performed reassortment detection on all the viruses in the dataset one by one in the order of their sampling time and identified 516 reassortment events. The details of each reassortment event can be found in <xref ref-type="supplementary-material" rid="SM9">Supplementary Table 9</xref>. According to the virus subtypes involved in reassortment, we divided reassortment events into intra-subtype reassortment and inter-subtype reassortment. Intra-subtype reassortment means that the subtype involved in reassortment is single, while inter-subtype reassortment means that the subtypes involved in reassortment are diverse. We analyzed the number of two reassortment patterns and found that the intra-subtype reassortment pattern was more common, which was shown in <xref ref-type="fig" rid="F5">Figure 5A</xref>. In particular, we analyzed the situation of two reassortment patterns of eight common subtypes including H1N1, H3N2, H5N1, H5N6, H6N2, H6N6, H7N9, and H9N2, which was shown in <xref ref-type="fig" rid="F5">Figure 5B</xref>. Viruses with H1N1, H3N2, H9N2 subtypes had a higher proportion of intra-subtype reassortment, while viruses with H5N1, H5N6, H6N2, H6N6, and H7N9 subtypes were more likely to be produced by reassortment of viruses with different subtypes.</p>
<fig id="F5" position="float">
<label>Figure 5</label>
<caption><p><bold>(A)</bold> The number of intra-subtype reassortment and inter-subtype reassortment. <bold>(B)</bold> Statistic of all reassortment events, intra-reassortment events and inter-subtype reassortment events for H1N1, H3N2, H5N1, H5N6, H6N2, H6N6, H7N9, and H9N2.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fviro-01-751196-g0005.tif"/>
</fig>
</sec>
<sec>
<title>Inter-subtype Reassortment Pattern</title>
<p>Although the intra-subtype reassortment pattern was frequent, we were more concerned about inter-subtype reassortment, since such reassortment pattern is more likely to produce pandemic strains. To this end, we made statistics on the frequency of other subtypes in the inter-subtype reassortment events of each subtype. We found that there were strong reassortment signals between H1N1 and H3N2, H6N2 and H6N6, H9N2, and other subtypes, which was shown in <xref ref-type="fig" rid="F6">Figure 6</xref>. H1N1 and H3N2 are common subtypes of human influenza viruses. The viruses with these two subtypes circulate seasonally every year, leading to frequent reassortment. The 2009 H1N1 pandemic is a typical example. The virus that caused this pandemic was a triple-reassorted strain whose genome is derived from H1N1 avian virus, H1N1 classical swine virus, and H3N2 human seasonal virus. We also noticed the reassortment relationship between H6N2 and H6N6. There were few subtypes related to H6N6 reassortment and more subtypes related to H6N2 reassortment. However, the reassortment association between the two subtypes was still much more than other subtypes. In 2011, the H6N6 avian influenza virus was isolated from swine in Guangdong Province, China (<xref ref-type="bibr" rid="B17">17</xref>), suggesting that the H6 subtype avian influenza virus has the potential to infect mammals and even humans. Therefore, the reassortment between H6N2 and H6N6 needs to be further monitored. It should be noted that we found H9N2 played an important role in the reassortment of other subtypes since its proportion was the first or second. Based on this, we analyzed the specific reassortment relationship between H9N2 and other subtypes.</p>
<fig id="F6" position="float">
<label>Figure 6</label>
<caption><p>The occurrence frequency of other subtypes in the inter-subtype reassortment event of a specific subtype (H1N1, H3N2, H5N1, H5N6, H6N2, H6N6, H7N9, and H9N2).</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fviro-01-751196-g0006.tif"/>
</fig>
</sec>
<sec>
<title>Reassortment Pattern Related to H9N2</title>
<p>H9N2 avian influenza virus spreads worldwide and is widespread in poultry in Asia (<xref ref-type="bibr" rid="B18">18</xref>&#x02013;<xref ref-type="bibr" rid="B20">20</xref>). A recent study has shown that H9N2 had replaced H5N6 and H7N9 as the dominant avian influenza virus subtype in chickens and ducks in China (<xref ref-type="bibr" rid="B21">21</xref>). At the same time, there is also evidence that H9N2 contributed to the emergence and evolution of human infection with avian influenza viruses such as H7N9, H10N8, and H5N6 (<xref ref-type="bibr" rid="B22">22</xref>&#x02013;<xref ref-type="bibr" rid="B24">24</xref>). In our study, we found that H9N2 provided internal segments for viruses with other subtypes. Among 61 inter-subtype reassortments related to H9N2, 27 events were H9N2 providing internal segments for H7N9. We also found four cases of H9N2 providing internal segments for H10N8 and four cases of H9N2 providing internal segments for H5N1. H9N2 occasionally provided internal segments for H5N2, H6N2, H6N6, H3N8, and H1N2. In addition, we found that these subtypes also provided internal segments for H9N2. These H9N2 viruses that obtained internal segments from other subtypes returned to the H9N2 gene pool and provided segments for subsequent reassortment. In general, the reassortment pattern related to H9N2 is complicated. It can provide internal segments for other subtypes, and can also obtain internal segments from other subtypes.</p>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<title>Discussion</title>
<p>With the continuous improvement of sequencing technology and reduction of sequencing costs, the number of sequences in the influenza virus database is rapidly increasing. The rapid growth of data drives the continuous advancement of analytical techniques. Although manual and semi-automatic methods are generally considered to produce standard results, they also have scalability and repeatability issues (<xref ref-type="bibr" rid="B12">12</xref>), and cannot cope with the challenges brought by data growth. In the automated method of reassortment detection, the phylogenetic method requires multiple sequence alignment and reconstruction of the phylogenetic tree to perform subsequent reassortment detection tasks. De Silva et al. (<xref ref-type="bibr" rid="B15">15</xref>) tried to use GiRaF (<xref ref-type="bibr" rid="B12">12</xref>) to reconstruct the phylogenetic map, they found that the calculation time was at least several months per segment. Therefore, we inevitably need to adopt methods that have nothing to do with phylogeny. The method proposed by Rabadan et al. (<xref ref-type="bibr" rid="B14">14</xref>) seemed to perform well in detecting reassortants within the pedigree, but cannot point out the specific source of reassortment. The method of de Silva et al. (<xref ref-type="bibr" rid="B15">15</xref>) found some well-supported candidate reassortants, but it depends on the size of its neighborhood, and different neighborhood sizes may lead to different results. In our work, we proposed a new phylogeny-independent method for automatic detection of reassortment. It can efficiently process large-scale data sets while studying the source of all segments of the influenza A virus genome to identify reassortment.</p>
<p>In our reassortment detection results, although there is no evidence that every reassortment event we detected exists, as a whole, the reassortment history and patterns reflected in our results can be supported by the relevant literature. According to reports, the reassortment between strains belonging to a single subtype may occur more frequently than inter-subtype reassortment (<xref ref-type="bibr" rid="B25">25</xref>), which can be found in our results (<xref ref-type="fig" rid="F5">Figure 5</xref>). In our analysis of the reassortment related to the H9N2 subtype, we found a reassortment pattern that H9N2 provided internal segments for other subtypes. This reassortment pattern has been confirmed by many researches (<xref ref-type="bibr" rid="B22">22</xref>&#x02013;<xref ref-type="bibr" rid="B24">24</xref>). In particular, in the avian influenza H7N9 virus that broke out in 2013, all internal gene segments were closely related to the gene segments of the avian influenza H9N2 virus (<xref ref-type="bibr" rid="B26">26</xref>). Related research has proposed a dynamic reassortment model of H7N9 virus evolution: H7N9 virus reassorted in the H9N2 gene pool, and was classified into different H9N2 gene pools under the promotion of poultry transportation, and undergoes further reassortment (<xref ref-type="bibr" rid="B27">27</xref>). In our early results (<xref ref-type="fig" rid="F3">Figure 3B</xref>), we also found that domestic birds played an important role in the H7N9 virus infecting humans. Subsequent analysis results also showed that H9N2 was the subtype most associated with H7N9, and it frequently provided internal segments for H7N9 by reassortment. At the same time, we found cases where H9N2 provided internal segments for H10N8. Almost all of these H10N8 viruses originated in Jiangxi, China, which coincides with the study by Wang et al. (<xref ref-type="bibr" rid="B28">28</xref>). The reassortment pattern that H9N2 provided internal segments for H5N1 can also be supported in the report (<xref ref-type="bibr" rid="B29">29</xref>). All in all, our reassortment detection method can perform reassortment detection on large-scale data sets and obtain effective conclusions.</p>
<p>Based on our method, researchers can study the reassortment pattern by detecting the reassortment of the viruses in the data set one by one. Researchers can also explore the source of each segment of the new virus without phylogenetic analysis. This can be achieved by comparing the feature vector of the new virus with the feature vector of the virus in the database. Although our reassortment detection method is applied to the influenza virus data set, this method also has a reference value for the reassortment of other segmented viruses. Our method will help automate the task of detecting influenza virus reassortment.</p>
</sec>
<sec sec-type="data-availability" id="s5">
<title>Data Availability Statement</title>
<p>The original contributions presented in the study are included in the article/<xref ref-type="supplementary-material" rid="SM10">Supplementary Material</xref>, further inquiries can be directed to the corresponding author/s.</p>
</sec>
<sec id="s6">
<title>Author Contributions</title>
<p>HR, WC, and JY: formulated the study. XG and MH: performed the research and analyzed the data. BW, YJ, HY, and LL: participated in analysis and discussion. XG and HR: drafted the manuscript. All authors contributed to the article and approved the submitted version.</p>
</sec>
<sec sec-type="funding-information" id="s7">
<title>Funding</title>
<p>This work was supported by the National Natural Science Foundation of China (grant numbers 32070025, 31800136, and 82041019) and the Research Project from State Key Laboratory of Pathogen and Biosecurity (grant number SKLPBS1807).</p>
</sec>
<sec sec-type="COI-statement" id="conf1">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s8">
<title>Publisher&#x00027;s Note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
</body>
<back>
<sec sec-type="supplementary-material" id="s9">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fviro.2021.751196/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fviro.2021.751196/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Data_Sheet_1.ZIP" id="SM1" mimetype="application/zip" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary Table 1</label>
<caption><p>The clustering results for PB2 segments.</p></caption> </supplementary-material>
<supplementary-material xlink:href="Data_Sheet_1.ZIP" id="SM2" mimetype="application/zip" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary Table 2</label>
<caption><p>The clustering results for PB1 segments.</p></caption> </supplementary-material>
<supplementary-material xlink:href="Data_Sheet_1.ZIP" id="SM3" mimetype="application/zip" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary Table 3</label>
<caption><p>The clustering results for PA segments.</p></caption> </supplementary-material>
<supplementary-material xlink:href="Data_Sheet_1.ZIP" id="SM4" mimetype="application/zip" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary Table 4</label>
<caption><p>The clustering results for HA segments.</p></caption> </supplementary-material>
<supplementary-material xlink:href="Data_Sheet_1.ZIP" id="SM5" mimetype="application/zip" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary Table 5</label>
<caption><p>The clustering results for NP segments.</p></caption> </supplementary-material>
<supplementary-material xlink:href="Data_Sheet_1.ZIP" id="SM6" mimetype="application/zip" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary Table 6</label>
<caption><p>The clustering results for NA segments.</p></caption> </supplementary-material>
<supplementary-material xlink:href="Data_Sheet_1.ZIP" id="SM7" mimetype="application/zip" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary Table 7</label>
<caption><p>The clustering results for MP segments.</p></caption> </supplementary-material>
<supplementary-material xlink:href="Data_Sheet_1.ZIP" id="SM8" mimetype="application/zip" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary Table 8</label>
<caption><p>The clustering results for NS segments.</p></caption> </supplementary-material>
<supplementary-material xlink:href="Data_Sheet_1.ZIP" id="SM9" mimetype="application/zip" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary Table 9</label>
<caption><p>The details of each reassortment event.</p></caption> </supplementary-material>
<supplementary-material xlink:href="Data_Sheet_1.ZIP" id="SM10" mimetype="application/zip" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary File</label>
<caption><p>AsiaGenome.zip (Genome data used in this paper).</p></caption> </supplementary-material>
<supplementary-material xlink:href="Data_Sheet_2.PDF" id="SM11" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Data_Sheet_3.xlsx" id="SM12" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Taubenberger</surname> <given-names>JK</given-names></name> <name><surname>Kash</surname> <given-names>JC</given-names></name></person-group>. <article-title>Influenza virus evolution, host adaptation, pandemic formation</article-title>. <source>Cell Host Microbe.</source> (<year>2010</year>) <volume>7</volume>:<fpage>440</fpage>&#x02013;<lpage>51</lpage>. <pub-id pub-id-type="doi">10.1016/j.chom.2010.05.009</pub-id><pub-id pub-id-type="pmid">20542248</pub-id></citation></ref>
<ref id="B2">
<label>2.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Marshall</surname> <given-names>N</given-names></name> <name><surname>Priyamvada</surname> <given-names>L</given-names></name> <name><surname>Ende</surname> <given-names>Z</given-names></name> <name><surname>Steel</surname> <given-names>J</given-names></name> <name><surname>Lowen</surname> <given-names>AC</given-names></name></person-group>. <article-title>Influenza virus reassortment occurs with high frequency in the absence of segment mismatch</article-title>. <source>PLoS Pathog.</source> (<year>2013</year>) <volume>9</volume>:<fpage>e1003421</fpage>. <pub-id pub-id-type="doi">10.1371/journal.ppat.1003421</pub-id><pub-id pub-id-type="pmid">23785286</pub-id></citation></ref>
<ref id="B3">
<label>3.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Vijaykrishna</surname> <given-names>D</given-names></name> <name><surname>Mukerji</surname> <given-names>R</given-names></name> <name><surname>Smith</surname> <given-names>GJ</given-names></name></person-group>. <article-title>RNA virus reassortment: an evolutionary mechanism for host jumps and immune evasion</article-title>. <source>PLoS Pathog.</source> (<year>2015</year>) <volume>11</volume>:<fpage>e1004902</fpage>. <pub-id pub-id-type="doi">10.1371/journal.ppat.1004902</pub-id><pub-id pub-id-type="pmid">26158697</pub-id></citation></ref>
<ref id="B4">
<label>4.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gao</surname> <given-names>R</given-names></name> <name><surname>Cao</surname> <given-names>B</given-names></name> <name><surname>Hu</surname> <given-names>Y</given-names></name> <name><surname>Feng</surname> <given-names>Z</given-names></name> <name><surname>Wang</surname> <given-names>D</given-names></name> <name><surname>Hu</surname> <given-names>W</given-names></name> <etal/></person-group>. <article-title>Human infection with a novel avian-origin influenza A (H7N9) virus</article-title>. <source>N Engl J Med.</source> (<year>2013</year>) <volume>368</volume>:<fpage>1888</fpage>&#x02013;<lpage>97</lpage>. <pub-id pub-id-type="doi">10.1056/NEJMoa1304459</pub-id><pub-id pub-id-type="pmid">24931229</pub-id></citation></ref>
<ref id="B5">
<label>5.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kageyama</surname> <given-names>T</given-names></name> <name><surname>Fujisaki</surname> <given-names>S</given-names></name> <name><surname>Takashita</surname> <given-names>E</given-names></name> <name><surname>Xu</surname> <given-names>H</given-names></name> <name><surname>Yamada</surname> <given-names>S</given-names></name> <name><surname>Uchida</surname> <given-names>Y</given-names></name> <etal/></person-group>. <article-title>Genetic analysis of novel avian A(H7N9) influenza viruses isolated from patients in China, February to April 2013</article-title>. <source>Euro Surveill.</source> (<year>2013</year>) <volume>18</volume>:<fpage>20453</fpage>. <pub-id pub-id-type="doi">10.2807/ese.18.15.20453-en</pub-id><pub-id pub-id-type="pmid">23594575</pub-id></citation></ref>
<ref id="B6">
<label>6.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lam</surname> <given-names>TT</given-names></name> <name><surname>Wang</surname> <given-names>J</given-names></name> <name><surname>Shen</surname> <given-names>Y</given-names></name> <name><surname>Zhou</surname> <given-names>B</given-names></name> <name><surname>Duan</surname> <given-names>L</given-names></name> <name><surname>Cheung</surname> <given-names>CL</given-names></name> <etal/></person-group>. <article-title>The genesis and source of the H7N9 influenza viruses causing human infections in China</article-title>. <source>Nature.</source> (<year>2013</year>) <volume>502</volume>:<fpage>241</fpage>&#x02013;<lpage>4</lpage>. <pub-id pub-id-type="doi">10.1038/nature12515</pub-id><pub-id pub-id-type="pmid">23965623</pub-id></citation></ref>
<ref id="B7">
<label>7.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lindstrom</surname> <given-names>SE</given-names></name> <name><surname>Hiromoto</surname> <given-names>Y</given-names></name> <name><surname>Nerome</surname> <given-names>R</given-names></name> <name><surname>Omoe</surname> <given-names>K</given-names></name> <name><surname>Sugita</surname> <given-names>S</given-names></name> <name><surname>Yamazaki</surname> <given-names>Y</given-names></name> <etal/></person-group>. <article-title>Phylogenetic analysis of the entire genome of influenza A (H3N2) viruses from Japan: evidence for genetic reassortment of the six internal genes</article-title>. <source>J Virol.</source> (<year>1998</year>) <volume>72</volume>:<fpage>8021</fpage>&#x02013;<lpage>31</lpage>. <pub-id pub-id-type="doi">10.1128/JVI.72.10.8021-8031.1998</pub-id><pub-id pub-id-type="pmid">9733841</pub-id></citation></ref>
<ref id="B8">
<label>8.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nelson</surname> <given-names>MI</given-names></name> <name><surname>Viboud</surname> <given-names>C</given-names></name> <name><surname>Simonsen</surname> <given-names>L</given-names></name> <name><surname>Bennett</surname> <given-names>RT</given-names></name> <name><surname>Griesemer</surname> <given-names>SB</given-names></name> <name><surname>St George</surname> <given-names>K</given-names></name> <etal/></person-group>. <article-title>Multiple reassortment events in the evolutionary history of H1N1 influenza A virus since 1918</article-title>. <source>PLoS Pathog.</source> (<year>2008</year>) <volume>4</volume>:<fpage>e1000012</fpage>. <pub-id pub-id-type="doi">10.1371/journal.ppat.1000012</pub-id><pub-id pub-id-type="pmid">18463694</pub-id></citation></ref>
<ref id="B9">
<label>9.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Holmes</surname> <given-names>EC</given-names></name> <name><surname>Ghedin</surname> <given-names>E</given-names></name> <name><surname>Miller</surname> <given-names>N</given-names></name> <name><surname>Taylor</surname> <given-names>J</given-names></name> <name><surname>Bao</surname> <given-names>Y</given-names></name> <name><surname>St George</surname> <given-names>K</given-names></name> <etal/></person-group>. <article-title>Whole-genome analysis of human influenza A virus reveals multiple persistent lineages and reassortment among recent H3N2 viruses</article-title>. <source>PLoS Biol.</source> (<year>2005</year>) <volume>3</volume>:<fpage>e300</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pbio.0030300</pub-id><pub-id pub-id-type="pmid">16026181</pub-id></citation></ref>
<ref id="B10">
<label>10.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Westgeest</surname> <given-names>KB</given-names></name> <name><surname>Russell</surname> <given-names>CA</given-names></name> <name><surname>Lin</surname> <given-names>X</given-names></name> <name><surname>Spronken</surname> <given-names>MI</given-names></name> <name><surname>Bestebroer</surname> <given-names>TM</given-names></name> <name><surname>Bahl</surname> <given-names>J</given-names></name> <etal/></person-group>. <article-title>Genomewide analysis of reassortment and evolution of human influenza A(H3N2) viruses circulating between 1968 and 2011</article-title>. <source>J Virol.</source> (<year>2014</year>) <volume>88</volume>:<fpage>2844</fpage>&#x02013;<lpage>57</lpage>. <pub-id pub-id-type="doi">10.1128/JVI.02163-13</pub-id><pub-id pub-id-type="pmid">24371052</pub-id></citation></ref>
<ref id="B11">
<label>11.</label>
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Yurovsky</surname> <given-names>Moret ABM</given-names></name></person-group>. <article-title>FluReF, an automated flu virus reassortment finder based on phylogenetic trees</article-title>. <source>BMC Genomics</source>. (<year>2011</year>) <volume>12</volume>(<supplement>Suppl. 2</supplement>):<fpage>S3</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2164-12-S2-S3</pub-id><pub-id pub-id-type="pmid">21989112</pub-id></citation></ref>
<ref id="B12">
<label>12.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nagarajan</surname> <given-names>N</given-names></name> <name><surname>Kingsford</surname> <given-names>C</given-names></name></person-group>. <article-title>GiRaF: robust, computational identification of influenza reassortments via graph mining</article-title>. <source>Nucleic Acids Res.</source> (<year>2011</year>) <volume>39</volume>:<fpage>e34</fpage>. <pub-id pub-id-type="doi">10.1093/nar/gkq1232</pub-id><pub-id pub-id-type="pmid">21177643</pub-id></citation></ref>
<ref id="B13">
<label>13.</label>
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Nagarajan</surname> <given-names>N</given-names></name> <name><surname>Kingsford</surname> <given-names>C</given-names></name></person-group>. <article-title>Uncovering genomic reassortments among influenza strains by enumerating maximal bicliques</article-title>. In: <source>2008 IEEE International Conference on Bioinformatics and Biomedicine</source>. <publisher-loc>Los Alamitos, CA</publisher-loc> (<year>2008</year>). p. <fpage>223</fpage>&#x02013;<lpage>30</lpage>.</citation>
</ref>
<ref id="B14">
<label>14.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rabadan</surname> <given-names>R</given-names></name> <name><surname>Levine</surname> <given-names>AJ</given-names></name> <name><surname>Krasnitz</surname></name></person-group>. <article-title>Non-random reassortment in human influenza A viruses</article-title>. <source>Influenza Other Respir Viruses.</source> (<year>2008</year>) <volume>2</volume>:<fpage>9</fpage>&#x02013;<lpage>22</lpage>. <pub-id pub-id-type="doi">10.1111/j.1750-2659.2007.00030.x</pub-id><pub-id pub-id-type="pmid">19453489</pub-id></citation></ref>
<ref id="B15">
<label>15.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>de Silva</surname> <given-names>UC</given-names></name> <name><surname>Tanaka</surname> <given-names>H</given-names></name> <name><surname>Nakamura</surname> <given-names>S</given-names></name> <name><surname>Goto</surname> <given-names>N</given-names></name> <name><surname>Yasunaga</surname> <given-names>T</given-names></name></person-group>. <article-title>A comprehensive analysis of reassortment in influenza A virus</article-title>. <source>Biol Open.</source> (<year>2012</year>) <volume>1</volume>:<fpage>385</fpage>&#x02013;<lpage>90</lpage>. <pub-id pub-id-type="doi">10.1242/bio.2012281</pub-id><pub-id pub-id-type="pmid">23213428</pub-id></citation></ref>
<ref id="B16">
<label>16.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wei</surname> <given-names>D</given-names></name> <name><surname>Jiang</surname> <given-names>Q</given-names></name> <name><surname>Wei</surname> <given-names>Y</given-names></name> <name><surname>Wang</surname> <given-names>S</given-names></name></person-group>. <article-title>A novel hierarchical clustering algorithm for gene sequences</article-title>. <source>BMC Bioinformatics.</source> (<year>2012</year>) <volume>13</volume>:<fpage>174</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2105-13-174</pub-id><pub-id pub-id-type="pmid">22823405</pub-id></citation></ref>
<ref id="B17">
<label>17.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>G</given-names></name> <name><surname>Kong</surname> <given-names>W</given-names></name> <name><surname>Qi</surname> <given-names>W</given-names></name> <name><surname>Long</surname> <given-names>LP</given-names></name> <name><surname>Cao</surname> <given-names>Z</given-names></name> <name><surname>Huang</surname> <given-names>L</given-names></name> <etal/></person-group>. <article-title>Identification of an H6N6 swine influenza virus in southern China</article-title>. <source>Infect Genet Evol.</source> (<year>2011</year>) <volume>11</volume>:<fpage>1174</fpage>&#x02013;<lpage>7</lpage>. <pub-id pub-id-type="doi">10.1016/j.meegid.2011.02.023</pub-id><pub-id pub-id-type="pmid">21382518</pub-id></citation></ref>
<ref id="B18">
<label>18.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Panshin</surname> <given-names>A</given-names></name> <name><surname>Golender</surname> <given-names>N</given-names></name> <name><surname>Davidson</surname> <given-names>I</given-names></name> <name><surname>Nagar</surname> <given-names>S</given-names></name> <name><surname>Garsia</surname> <given-names>M</given-names></name> <name><surname>Jackwood</surname> <given-names>MW</given-names></name> <etal/></person-group>. <article-title>Variability of NS1 proteins among H9N2 avian influenza viruses isolated in Israel during 2000-2009</article-title>. <source>Virus Genes.</source> (<year>2010</year>) <volume>41</volume>:<fpage>396</fpage>&#x02013;<lpage>405</lpage>. <pub-id pub-id-type="doi">10.1007/s11262-010-0522-3</pub-id><pub-id pub-id-type="pmid">20721688</pub-id></citation></ref>
<ref id="B19">
<label>19.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sun</surname> <given-names>Y</given-names></name> <name><surname>Pu</surname> <given-names>J</given-names></name> <name><surname>Jiang</surname> <given-names>Z</given-names></name> <name><surname>Guan</surname> <given-names>T</given-names></name> <name><surname>Xia</surname> <given-names>Y</given-names></name> <name><surname>Xu</surname> <given-names>Q</given-names></name> <etal/></person-group>. <article-title>Genotypic evolution and antigenic drift of H9N2 influenza viruses in China from 1994 to 2008</article-title>. <source>Vet Microbiol.</source> (<year>2010</year>) <volume>146</volume>:<fpage>215</fpage>&#x02013;<lpage>25</lpage>. <pub-id pub-id-type="doi">10.1016/j.vetmic.2010.05.010</pub-id><pub-id pub-id-type="pmid">20685047</pub-id></citation></ref>
<ref id="B20">
<label>20.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Xu</surname> <given-names>KM</given-names></name> <name><surname>Smith</surname> <given-names>GJ</given-names></name> <name><surname>Bahl</surname> <given-names>J</given-names></name> <name><surname>Duan</surname> <given-names>L</given-names></name> <name><surname>Tai</surname> <given-names>H</given-names></name> <name><surname>Vijaykrishna</surname> <given-names>D</given-names></name> <etal/></person-group>. <article-title>The genesis and evolution of H9N2 influenza viruses in poultry from southern China, 2000 to 2005</article-title>. <source>J Virol.</source> (<year>2007</year>) <volume>81</volume>:<fpage>10389</fpage>&#x02013;<lpage>401</lpage>. <pub-id pub-id-type="doi">10.1128/JVI.00979-07</pub-id><pub-id pub-id-type="pmid">17652402</pub-id></citation></ref>
<ref id="B21">
<label>21.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bi</surname> <given-names>Y</given-names></name> <name><surname>Li</surname> <given-names>J</given-names></name> <name><surname>Li</surname> <given-names>S</given-names></name> <name><surname>Fu</surname> <given-names>G</given-names></name> <name><surname>Jin</surname> <given-names>T</given-names></name> <name><surname>Zhang</surname> <given-names>C</given-names></name> <etal/></person-group>. <article-title>Dominant subtype switch in avian influenza viruses during 2016-2019 in China</article-title>. <source>Nat Commun.</source> (<year>2020</year>) <volume>11</volume>:<fpage>5909</fpage>. <pub-id pub-id-type="doi">10.1038/s41467-020-19671-3</pub-id><pub-id pub-id-type="pmid">33219213</pub-id></citation></ref>
<ref id="B22">
<label>22.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname> <given-names>D</given-names></name> <name><surname>Shi</surname> <given-names>W</given-names></name> <name><surname>Gao</surname> <given-names>GF</given-names></name></person-group>. <article-title>Poultry carrying H9N2 act as incubators for novel human avian influenza viruses</article-title>. <source>Lancet.</source> (<year>2014</year>) <volume>383</volume>:<fpage>869</fpage>. <pub-id pub-id-type="doi">10.1016/S0140-6736(14)60386-X</pub-id><pub-id pub-id-type="pmid">24581684</pub-id></citation></ref>
<ref id="B23">
<label>23.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pu</surname> <given-names>J</given-names></name> <name><surname>Wang</surname> <given-names>S</given-names></name> <name><surname>Yin</surname> <given-names>Y</given-names></name> <name><surname>Zhang</surname> <given-names>G</given-names></name> <name><surname>Carter</surname> <given-names>RA</given-names></name> <name><surname>Wang</surname> <given-names>J</given-names></name> <etal/></person-group>. <article-title>Evolution of the H9N2 influenza genotype that facilitated the genesis of the novel H7N9 virus</article-title>. <source>Proc Natl Acad Sci USA.</source> (<year>2015</year>) <volume>112</volume>:<fpage>548</fpage>&#x02013;<lpage>53</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1422456112</pub-id><pub-id pub-id-type="pmid">25548189</pub-id></citation></ref>
<ref id="B24">
<label>24.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Su</surname> <given-names>S</given-names></name> <name><surname>Bi</surname> <given-names>Y</given-names></name> <name><surname>Wong</surname> <given-names>G</given-names></name> <name><surname>Gray</surname> <given-names>GC</given-names></name> <name><surname>Gao</surname> <given-names>GF</given-names></name> <name><surname>Li</surname> <given-names>S</given-names></name></person-group>. <article-title>Epidemiology, evolution, and recent outbreaks of avian influenza virus in China</article-title>. <source>J Virol.</source> (<year>2015</year>) <volume>89</volume>:<fpage>8671</fpage>&#x02013;<lpage>6</lpage>. <pub-id pub-id-type="doi">10.1128/JVI.01034-15</pub-id><pub-id pub-id-type="pmid">26063419</pub-id></citation></ref>
<ref id="B25">
<label>25.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nelson</surname> <given-names>MI</given-names></name> <name><surname>Holmes</surname> <given-names>EC</given-names></name></person-group>. <article-title>The evolution of epidemic influenza</article-title>. <source>Nat Rev Genet.</source> (<year>2007</year>) <volume>8</volume>:<fpage>196</fpage>&#x02013;<lpage>205</lpage>. <pub-id pub-id-type="doi">10.1038/nrg2053</pub-id><pub-id pub-id-type="pmid">17262054</pub-id></citation></ref>
<ref id="B26">
<label>26.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname> <given-names>D</given-names></name> <name><surname>Shi</surname> <given-names>W</given-names></name> <name><surname>Shi</surname> <given-names>Y</given-names></name> <name><surname>Wang</surname> <given-names>D</given-names></name> <name><surname>Xiao</surname> <given-names>H</given-names></name> <name><surname>Li</surname> <given-names>W</given-names></name> <etal/></person-group>. <article-title>Origin and diversity of novel avian influenza A H7N9 viruses causing human infection: phylogenetic, structural, coalescent analyses</article-title>. <source>Lancet.</source> (<year>2013</year>) <volume>381</volume>:<fpage>1926</fpage>&#x02013;<lpage>32</lpage>. <pub-id pub-id-type="doi">10.1016/S0140-6736(13)60938-1</pub-id><pub-id pub-id-type="pmid">23643111</pub-id></citation></ref>
<ref id="B27">
<label>27.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cui</surname> <given-names>L</given-names></name> <name><surname>Liu</surname> <given-names>D</given-names></name> <name><surname>Shi</surname> <given-names>W</given-names></name> <name><surname>Pan</surname> <given-names>J</given-names></name> <name><surname>Qi</surname> <given-names>X</given-names></name> <name><surname>Li</surname> <given-names>X</given-names></name> <etal/></person-group>. <article-title>Dynamic reassortments and genetic heterogeneity of the human-infecting influenza A (H7N9) virus</article-title>. <source>Nat Commun.</source> (<year>2014</year>) <volume>5</volume>:<fpage>3142</fpage>. <pub-id pub-id-type="doi">10.1038/ncomms4142</pub-id><pub-id pub-id-type="pmid">24457975</pub-id></citation></ref>
<ref id="B28">
<label>28.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname> <given-names>M</given-names></name> <name><surname>Li</surname> <given-names>X</given-names></name> <name><surname>Yuan</surname> <given-names>H</given-names></name> <name><surname>Zhou</surname> <given-names>J</given-names></name> <name><surname>Wu</surname> <given-names>J</given-names></name> <name><surname>Bo</surname> <given-names>H</given-names></name> <etal/></person-group>. <article-title>Genetic diversity of avian influenza A (H10N8) virus in live poultry markets and its association with human infections in China</article-title>. <source>Sci Rep.</source> (<year>2015</year>) <volume>5</volume>:<fpage>7632</fpage>. <pub-id pub-id-type="doi">10.1038/srep07632</pub-id><pub-id pub-id-type="pmid">25591167</pub-id></citation></ref>
<ref id="B29">
<label>29.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Guan</surname> <given-names>Y</given-names></name> <name><surname>Shortridge</surname> <given-names>KF</given-names></name> <name><surname>Krauss</surname> <given-names>S</given-names></name> <name><surname>Webster</surname> <given-names>RG</given-names></name></person-group>. <article-title>Molecular characterization of H9N2 influenza viruses: were they the donors of the &#x0201C;internal&#x0201D; genes of H5N1 viruses in Hong Kong?</article-title> <source>Proc Natl Acad Sci USA.</source> (<year>1999</year>) <volume>96</volume>:<fpage>9363</fpage>&#x02013;<lpage>7</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.96.16.9363</pub-id><pub-id pub-id-type="pmid">10430948</pub-id></citation></ref>
</ref-list> 
</back>
</article>