<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Genet.</journal-id>
<journal-title>Frontiers in Genetics</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Genet.</abbrev-journal-title>
<issn pub-type="epub">1664-8021</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1024577</article-id>
<article-id pub-id-type="doi">10.3389/fgene.2022.1024577</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Genetics</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>ggMOB: Elucidation of genomic conjugative features and associated cargo genes across bacterial genera using genus-genus mobilization networks</article-title>
<alt-title alt-title-type="left-running-head">Nayar et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/fgene.2022.1024577">10.3389/fgene.2022.1024577</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Nayar</surname>
<given-names>Gowri</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Terrizzano</surname>
<given-names>Ignacio</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Seabolt</surname>
<given-names>Ed</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Agarwal</surname>
<given-names>Akshay</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Boucher</surname>
<given-names>Christina</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/834161/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Ruiz</surname>
<given-names>Jaime</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2038569/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Slizovskiy</surname>
<given-names>Ilya B.</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/804146/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Kaufman</surname>
<given-names>James H.</given-names>
</name>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Noyes</surname>
<given-names>Noelle R.</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/564069/overview"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Department of Biomedical Informatics</institution>, <institution>Stanford University</institution>, <addr-line>Stanford</addr-line>, <addr-line>CA</addr-line>, <country>United States</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>IBM Research Almaden</institution>, <addr-line>San Jose</addr-line>, <addr-line>CA</addr-line>, <country>United States</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Department of Computer and Information Science and Engineering</institution>, <institution>University of Florida</institution>, <addr-line>Gainesville</addr-line>, <addr-line>FL</addr-line>, <country>United States</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Department of Veterinary Population Medicine</institution>, <institution>University of Minnesota</institution>, <addr-line>Minneapolis</addr-line>, <addr-line>MN</addr-line>, <country>United States</country>
</aff>
<aff id="aff5">
<sup>5</sup>
<institution>Altos Labs</institution>, <addr-line>Redwood City</addr-line>, <addr-line>CA</addr-line>, <country>United States</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/124337/overview">Marco Pellegrini</ext-link>, National Research Council (CNR), Italy</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/399317/overview">Ahmed Moustafa</ext-link>, American University in Cairo, Egypt</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/861372/overview">Daljeet Singh Dhanjal</ext-link>, Lovely Professional University, India</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Noelle R. Noyes, <email>nnoyes@umn.edu</email>
</corresp>
<fn fn-type="other">
<p>This article was submitted to Computational Genomics, a section of the journal Frontiers in Genetics</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>08</day>
<month>12</month>
<year>2022</year>
</pub-date>
<pub-date pub-type="collection">
<year>2022</year>
</pub-date>
<volume>13</volume>
<elocation-id>1024577</elocation-id>
<history>
<date date-type="received">
<day>21</day>
<month>08</month>
<year>2022</year>
</date>
<date date-type="accepted">
<day>25</day>
<month>10</month>
<year>2022</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2022 Nayar, Terrizzano, Seabolt, Agarwal, Boucher, Ruiz, Slizovskiy, Kaufman and Noyes.</copyright-statement>
<copyright-year>2022</copyright-year>
<copyright-holder>Nayar, Terrizzano, Seabolt, Agarwal, Boucher, Ruiz, Slizovskiy, Kaufman and Noyes</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Horizontal gene transfer mediated by conjugation is considered an important evolutionary mechanism of bacteria. It allows organisms to quickly evolve new phenotypic properties including antimicrobial resistance (AMR) and virulence. The frequency of conjugation-mediated cargo gene exchange has not yet been comprehensively studied within and between bacterial taxa. We developed a frequency-based network of genus-genus conjugation features and candidate cargo genes from whole-genome sequence data of over 180,000 bacterial genomes, representing 1,345 genera. Using our method, which we refer to as ggMOB, we revealed that over half of the bacterial genomes contained one or more known conjugation features that matched exactly to at least one other genome. Moreover, the proportion of genomes containing these conjugation features varied substantially by genus and conjugation feature. These results and the genus-level network structure can be viewed interactively in the ggMOB interface, which allows for user-defined filtering of conjugation features and candidate cargo genes. Using the network data, we observed that the ratio of AMR gene representation in conjugative <italic>versus</italic> non-conjugative genomes exceeded 5:1, confirming that conjugation is a critical force for AMR spread across genera. Finally, we demonstrated that clustering genomes by conjugation profile sometimes correlated well with classical phylogenetic structuring; but that in some cases the clustering was highly discordant, suggesting that the importance of the accessory genome in driving bacterial evolution may be highly variable across both time and taxonomy. These results can advance scientific understanding of bacterial evolution, and can be used as a starting point for probing genus-genus gene exchange within complex microbial communities that include unculturable bacteria. ggMOB is publicly available under the GNU licence at <ext-link ext-link-type="uri" xlink:href="https://ruiz-hci-lab.github.io/ggMOB/">https://ruiz-hci-lab.github.io/ggMOB/</ext-link>
</p>
</abstract>
<kwd-group>
<kwd>antimicobial resistance</kwd>
<kwd>genomics</kwd>
<kwd>metagenomics</kwd>
<kwd>big data</kwd>
<kwd>mobile genetic elements (MGE)</kwd>
</kwd-group>
</article-meta>
</front>
<body>
<sec id="s1">
<title>1 Introduction</title>
<p>Several mechanisms of horizontal gene transfer (HGT) allow bacteria to exchange genetic material. One of these mechanisms, termed conjugation, occurs when bacterial cells form direct physical contacts that allow for passage of genetic material from one bacterium to another. The machinery required to form these contacts and initiate genetic exchange is often contained within integrative and conjugative elements (ICE), plasmids, and other mobile genetic elements (MGEs) (<xref ref-type="bibr" rid="B22">Frost et al., 2005</xref>; <xref ref-type="bibr" rid="B75">Wozniak and Waldor, 2010</xref>; <xref ref-type="bibr" rid="B54">Roberts and Mullany, 2011</xref>; <xref ref-type="bibr" rid="B74">Wiedenbeck and Cohan, 2011</xref>; <xref ref-type="bibr" rid="B49">Perry and Wright, 2013</xref>; <xref ref-type="bibr" rid="B27">Johnson and Grossman, 2015</xref>; <xref ref-type="bibr" rid="B60">Singer et al., 2016</xref>). The conditions that induce excision and conjugation are not fully elucidated, but DNA damage and subsequent SOS response seem to be an important trigger (<xref ref-type="bibr" rid="B71">Waldor et al., 2004</xref>; <xref ref-type="bibr" rid="B29">Koraimann and Wagner, 2014</xref>). The cost of acquiring and maintaining the new genetic material also influences the success of transfer events (<xref ref-type="bibr" rid="B70">Uhlemann et al., 2021</xref>).</p>
<p>Genes exchanged between bacteria during conjugation include functional domains associated with conjugative machinery (e.g., excisionases, integrases, conjugative transport proteins) as well as intervening &#x201c;accessory&#x201d; genes that are not necessary for conjugation, often termed &#x201c;cargo genes&#x201d; (<xref ref-type="bibr" rid="B27">Johnson and Grossman, 2015</xref>). By pairing conjugative machinery with an array of diverse cargo genes, bacterial communities can significantly expand their genetic repertoire, including between bacteria of diverse taxonomy (<xref ref-type="bibr" rid="B25">Guglielmini et al., 2011</xref>; <xref ref-type="bibr" rid="B6">Bellanger et al., 2014</xref>; <xref ref-type="bibr" rid="B56">Neil and Allard, 2021</xref>). Functions commonly associated with conjugative cargo include antimicrobial resistance (AMR) and virulence (<xref ref-type="bibr" rid="B54">Roberts and Mullany, 2011</xref>; <xref ref-type="bibr" rid="B49">Perry and Wright, 2013</xref>; <xref ref-type="bibr" rid="B27">Johnson and Grossman, 2015</xref>; <xref ref-type="bibr" rid="B18">Cury et al., 2017</xref>), which can pose a risk to human and animal health if transferred into pathogens (<xref ref-type="bibr" rid="B47">Partridge et al., 2018</xref>). Therefore, understanding the microbial ecology of conjugative elements and cargo genes (i.e., their distribution and behavior across bacterial taxa) is important in assessing the risk posed by various bacterial communities (<xref ref-type="bibr" rid="B24">Gaston et al., 2021</xref>). For example, how often do different bacterial taxa carry conjugative machinery and AMR genes; what resistance phenotypes are commonly associated with the presence of conjugative machinery within the genome; how often do different commensal bacterial taxa carry out conjugation to exchange cargo genes with pathogens; and what conditions foster conjugative exchange of specific cargo genes between pathogens and non-pathogens? These questions are fundamental to understanding how bacterial communities respond to external stimuli, and how these responses increase the overall risk posed by microbial communities of varying composition (<xref ref-type="bibr" rid="B35">Mart&#xed;nez et al., 2015</xref>; <xref ref-type="bibr" rid="B42">Oh et al., 2018</xref>).</p>
<p>However, the process of conjugative HGT is highly stochastic and therefore, difficult to predict (<xref ref-type="bibr" rid="B34">Lopatkin and Collin, 2020</xref>). One reason for this stochasticity is variability in the conjugation competency of donor and recipient bacterial cells for a given conjugative MGE; as well as variability in the capacity of a given type of conjugative MGE to also transfer unrelated cargo genes. Recent meta-analyses of conjugation rates for specific bacterial species and/or MGEs have highlighted these complexities (<xref ref-type="bibr" rid="B2">Alderliesten et al., 2020</xref>; <xref ref-type="bibr" rid="B59">Sheppard et al., 2020</xref>). Historically, the scientific process for estimating conjugative likelihood has stemmed from highly controlled <italic>in vitro</italic> experiments between pairs of bacterial isolates and specific MGEs. Results from such studies have been crucial for uncovering the behavior of MGEs and their importance for functions such as AMR. However, reductive experiments typically do not generalize well to the complex microbial communities found <italic>in situ</italic>, including host and environmental microbiomes. Furthermore, these experiments are necessarily restricted in their ability to characterize the full bacterial host range of a given MGE, as they typically involve only several distinct bacterial taxa. One major challenge that remains is to generate a conjugation likelihood for every host-donor-MGE combination observed across all bacterial taxa and MGE.</p>
<p>Insight into this challenge can be gained through the plethora of whole genome sequence (WGS) data which is now publicly available. As an example, the analysis of HGT-associated genes from just 336 genomes across 16 phyla was sufficient to significantly improve bacterial phylogenies as compared to those obtained from conserved marker genes (<xref ref-type="bibr" rid="B1">Abby et al., 2012</xref>). An analysis of 1,000 genomes demonstrated that ICE machinery is ubiquitous across diverse prokaryotes, and likely one of the most common mechanisms of bacterial evolution (<xref ref-type="bibr" rid="B25">Guglielmini et al., 2011</xref>). Currently, public datasets contain orders of magnitude more WGS data, which can be used to improve our understanding of the mechanisms by which critically important genes and pathogens emerge and persist (<xref ref-type="bibr" rid="B10">Botelho et al., 2020</xref>). However, despite the importance of HGT in bacterial evolution and pathogenicity, there has not yet been a comprehensive, systematic survey of the frequency of conjugation and cargo genes within or between bacterial genera. The objective of this work was to describe intra- and inter-genus conjugation-cargo dynamics by leveraging the comprehensive set of WGS data and conjugation sequences currently available within the Reference Sequence (RefSeq) and Short Read Archive (SRA) databases at the National Center for Biotechnology Information (NCBI). In particular, we analyzed 186,887 WGS datasets to identify putative conjugation events and corresponding candidate cargo genes, as well as to characterize the frequency of AMR genes with respect to the frequency of their occurrence with conjugative proteins. We were able to identify over 95,000 genomes containing conjugative proteins, and more than 4 billion putative cargo genes between genomes. We summarize and disseminate this analysis through an open-source network that describes the genus-genus sharing of conjugation features and cargo genes, representing genomes from over 1,300 different genera. Our network, which we refer to as ggMOB, allows users to filter for both conjugation features and putative cargo genes. Using ggMOB we analyzed the ratio of AMR gene representation in conjugative <italic>versus</italic> non-conjugative genomes and found it to be greater than 5:1, confirming that conjugation is a critical force for AMR spread across genera. Finally, we demonstrated that clustering genomes by conjugation profile sometimes correlated well with taxonomic structuring, but in some cases was highly discordant, suggesting that the importance of the accessory genome in driving bacterial evolution may be highly variable across genera. These results demonstrates that ggMOB can be used to further probe potential genus-genus mobilization dynamics, and thus, provide insight into conjugative mobilization between unculturable bacteria and complex interactions involving multiple genera.</p>
</sec>
<sec sec-type="results" id="s2">
<title>2 Results</title>
<sec id="s2-1">
<title>2.1 Overview of ggMOB</title>
<p>The analyses conducted in this paper were derived from an existing resource (<xref ref-type="bibr" rid="B58">Seabolt et al., 2020</xref>), which was constructed by curating and annotating 186,887 genomes from NCBI (see MATERIALS AND METHODS). Using the sequence data and annotated features obtained from over 166,000 curated and high-quality WGS datasets, we identified genomes that contained conjugative features (<xref ref-type="table" rid="T1">Table 1</xref>), which we term conjugative genomes (see MATERIALS AND METHODS). By recording counts of shared features across these conjugative genomes, we constructed ggMOB (the &#x201c;genus-genus mobilization&#x201d; network), which contains information about features that are shared between conjugative genus-genus pairs.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Conjugative features included in this study. Color label indicates the color used to represent the conjugative feature in <xref ref-type="fig" rid="F2">Figure 2</xref>. Yellow indicates a conjugative feature defined by a single IPR code and red indicates a family of codes. Genome count indicates the number of genomes that contain the conjugative feature.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Label</th>
<th align="left">Conjugative feature</th>
<th align="left">Genome count</th>
<th align="left">Description</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx1.tif"/>
</td>
<td align="left">ICE6013</td>
<td align="left">93,267</td>
<td align="left">Includes IS30-like DDE transposase. More closely related to ICEBs1 than Tn5801 <xref ref-type="bibr" rid="B64">Smyth and Robinson. (2009)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx2.tif"/>
</td>
<td align="left">Tn916</td>
<td align="left">59,718</td>
<td align="left">TetM and other resistance genes <xref ref-type="bibr" rid="B15">Clewell et al. (1995)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx3.tif"/>
</td>
<td align="left">IPR025955</td>
<td align="left">49,841</td>
<td align="left">Type-IV secretion system protein TraC <break/>
<xref ref-type="bibr" rid="B21">Finn et al. (2016)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx4.tif"/>
</td>
<td align="left">ICEEc2</td>
<td align="left">49,543</td>
<td align="left">set of three genes encoding DNA mobility enzymes and type IV pilus <xref ref-type="bibr" rid="B55">Roche et al. (2010)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx5.tif"/>
</td>
<td align="left">IPR005094</td>
<td align="left">42,760</td>
<td align="left">Endonuclease relaxase, MobA, VirD2 <xref ref-type="bibr" rid="B21">Finn et al. (2016)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx6.tif"/>
</td>
<td align="left">ICEhin1056</td>
<td align="left">42,252</td>
<td align="left">Antibiotic resistance island <xref ref-type="bibr" rid="B40">Mohd-Zain et al. (2004)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx7.tif"/>
</td>
<td align="left">IPR011119</td>
<td align="left">28,752</td>
<td align="left">Unchar. domain, putative helicase, relaxase <xref ref-type="bibr" rid="B21">Finn et al. (2016)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx8.tif"/>
</td>
<td align="left">IPR014862</td>
<td align="left">26,295</td>
<td align="left">TrwC relaxase <xref ref-type="bibr" rid="B21">Finn et al. (2016)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx9.tif"/>
</td>
<td align="left">IPR014059</td>
<td align="left">23,368</td>
<td align="left">Conjugative relaxase, N-terminal <xref ref-type="bibr" rid="B10">Finn et al. (2016)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx10.tif"/>
</td>
<td align="left">PAPI-1</td>
<td align="left">22,855</td>
<td align="left">Pathogenicity island PAPI-1 of strain PA14.115 gene cluster includes virulence phenotypes <xref ref-type="bibr" rid="B51">Qiu et al. (2006)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx11.tif"/>
</td>
<td align="left">pKLC102</td>
<td align="left">22,460</td>
<td align="left">Hybrid of plasmid and phage origin includes replication, partitioning, conjugation, pili, &#x26; integrase genes <xref ref-type="bibr" rid="B28">Klockgether et al. (2004)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx12.tif"/>
</td>
<td align="left">IPR021300</td>
<td align="left">22,284</td>
<td align="left">Integrating conjugative element protein <xref ref-type="bibr" rid="B21">Finn et al. (2016)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx13.tif"/>
</td>
<td align="left">IPR022391</td>
<td align="left">21,465</td>
<td align="left">Integrating conjugative element relaxase, PFGI-1 class <xref ref-type="bibr" rid="B21">Finn et al. (2016)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx14.tif"/>
</td>
<td align="left">IPR022303</td>
<td align="left">19,664</td>
<td align="left">Conjugative transfer ATPase <xref ref-type="bibr" rid="B21">Finn et al. (2016)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx15.tif"/>
</td>
<td align="left">ICEPdaSpa1</td>
<td align="left">19,424</td>
<td align="left">An SXT-related ICE derived; causative agent of fish pasteurellosis <xref ref-type="bibr" rid="B43">Osorio et al. (2008)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx16.tif"/>
</td>
<td align="left">IPR014129</td>
<td align="left">18,029</td>
<td align="left">Conjugative transfer relaxase protein TraI <xref ref-type="bibr" rid="B21">Finn et al. (2016)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx17.tif"/>
</td>
<td align="left">SXT</td>
<td align="left">17,525</td>
<td align="left">Family of conjugative-transposon-like mobile elements encoding multiple AR genes <xref ref-type="bibr" rid="B5">Beaber et al. (2002)</xref>; <xref ref-type="bibr" rid="B11">Burrus et al. (2006)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx18.tif"/>
</td>
<td align="left">ICEEc1</td>
<td align="left">10,170</td>
<td align="left">High-pathogenicity island (HPI); evidence for Combinatorial Transfers <xref ref-type="bibr" rid="B44">Paauw et al. (2010)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx19.tif"/>
</td>
<td align="left">R391</td>
<td align="left">9,916</td>
<td align="left">Archetype of IncJ; carries AR, DNA repair, &#x26; mercury resistance genes <xref ref-type="bibr" rid="B9">B&#xf6;ltner et al. (2002)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx20.tif"/>
</td>
<td align="left">ICEKp1</td>
<td align="left">9,117</td>
<td align="left">Resembles functional ICEEc1 <xref ref-type="bibr" rid="B44">Paauw et al. (2010)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx21.tif"/>
</td>
<td align="left">ICESde3396</td>
<td align="left">9,088</td>
<td align="left">Carries genes predicted to be involved in virulence and resistance to various metals <xref ref-type="bibr" rid="B63">Smyth et al. (2014)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx22.tif"/>
</td>
<td align="left">ICEBs1</td>
<td align="left">8,504</td>
<td align="left">Plasmid mobilization and putative coupling protein <xref ref-type="bibr" rid="B32">Lee et al. (2012)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx23.tif"/>
</td>
<td align="left">RD2</td>
<td align="left">8,370</td>
<td align="left">Encodes seven putative secreted extracellular proteins <xref ref-type="bibr" rid="B61">Sitkiewicz et al. (2011)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx24.tif"/>
</td>
<td align="left">IPR011952</td>
<td align="left">2,640</td>
<td align="left">Conserved hypothetical protein CHP02256 <xref ref-type="bibr" rid="B21">Finn et al. (2016)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx25.tif"/>
</td>
<td align="left">IPR014136</td>
<td align="left">2,050</td>
<td align="left">Ti-type conjugative transfer relaxase TraA <xref ref-type="bibr" rid="B21">Finn et al. (2016)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx26.tif"/>
</td>
<td align="left">TnGBS2</td>
<td align="left">1,630</td>
<td align="left">See ICE6013 <xref ref-type="bibr" rid="B20">Everitt et al. (2014)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx27.tif"/>
</td>
<td align="left">CTnBST</td>
<td align="left">1,520</td>
<td align="left">Tyrosine recombinase family <xref ref-type="bibr" rid="B65">Song et al. (2007)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx28.tif"/>
</td>
<td align="left">ICEclc</td>
<td align="left">1,465</td>
<td align="left">Cargo for ortho-cleavage of chlorocatechols and aminophenol metabolism (amr genes) <xref ref-type="bibr" rid="B41">Obi et al. (2018)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx29.tif"/>
</td>
<td align="left">GI3</td>
<td align="left">1,340</td>
<td align="left">Degradation of aromatic compounds and detoxification of heavy metals <xref ref-type="bibr" rid="B31">Lechner et al. (2009)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx30.tif"/>
</td>
<td align="left">Tn1549</td>
<td align="left">648</td>
<td align="left">VanB-type resistance to glycopeptides with regions <xref ref-type="bibr" rid="B23">Garnier et al. (2000)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx31.tif"/>
</td>
<td align="left">CTn341</td>
<td align="left">389</td>
<td align="left">Encodes tetracycline resistance and its transfer is induced by tetracycline <xref ref-type="bibr" rid="B48">Peed et al. (2010)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx32.tif"/>
</td>
<td align="left">IPR020369</td>
<td align="left">119</td>
<td align="left">Mobilisation protein B <xref ref-type="bibr" rid="B21">Finn et al. (2016)</xref>
</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left">(i) excision-integration process <xref ref-type="bibr" rid="B23">Garnier et al. (2000)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx33.tif"/>
</td>
<td align="left">Tn4555</td>
<td align="left">79</td>
<td align="left">Includes cfxA gene encoding</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left">broad-spectrum beta-lactamase <xref ref-type="bibr" rid="B62">Smith and Parker (1993)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx34.tif"/>
</td>
<td align="left">ICESt1</td>
<td align="left">26</td>
<td align="left">Integrative and putative transfer functions <xref ref-type="bibr" rid="B12">Burrus et al. (2002)</xref>; <xref ref-type="bibr" rid="B7">Bellanger et al. (2009)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx35.tif"/>
</td>
<td align="left">ICEMISymR7A</td>
<td align="left">16</td>
<td align="left">Rhizobial symbiosis genes <xref ref-type="bibr" rid="B53">Ramsay and Ronson (2015)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx36.tif"/>
</td>
<td align="left">ICESt3</td>
<td align="left">14</td>
<td align="left">Integrative and putative transfer functions <xref ref-type="bibr" rid="B7">Bellanger et al. (2009)</xref>
</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left">(ii) vanB2 operon replaces tet(M) <xref ref-type="bibr" rid="B23">Garnier et al. (2000)</xref>
</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left">(iii) Conjugative transfer <xref ref-type="bibr" rid="B23">Garnier et al. (2000)</xref>
</td>
</tr>
<tr>
<td>
<inline-graphic xlink:href="FGENE_fgene-2022-1024577_wc_tfx37.tif"/>
</td>
<td align="left">Tn4371</td>
<td align="left">0</td>
<td align="left">Biphenyl and 4-chlorobiphenyl degradation <xref ref-type="bibr" rid="B66">Springael et al. (1993)</xref>
</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s2-2">
<title>2.2 Inter- and intra-genus conjugation profiles</title>
<p>Of the 106,443 genomes that contained at least one conjugative feature, 95,781 shared at least one conjugative feature with at least one other genome in the set, indicating a common evolutionary history. These 95,781 conjugative genomes represented close to 47% (631 of the 1,345) of the genera contained in the relational database (<xref ref-type="bibr" rid="B58">Seabolt et al., 2020</xref>). The lack of conjugative machinery in the other 714 genera may be a false negative finding (i.e., incomplete list of conjugative features, lack of representation in the utilized NCBI databases, or lack of inclusion in genome assemblies), or could indicate inherent differences in the conjugative ability of genera across the taxonomic tree. Similarly, one might reasonably expect the number of observed conjugative genomes to scale with the number of genomes available for each genus. However, genus representation in NCBI is not uniform across genera, leading to bias in available genomes per genus. To correct for this imbalance, we computed the conjugative genome proportion by normalizing the number of observed conjugative genomes to the total number of genomes per genus (<xref ref-type="table" rid="T2">Table 2</xref>). This analysis demonstrated that the genera with the largest fraction of conjugative genomes were <italic>not</italic> the genera with the most genomes in NCBI. For example, although <italic>Salmonella</italic> had by far the greatest number of high quality genomes (N &#x3d; 39,574), it ranked fifth in terms of the proportion of genomes that contained a conjugative feature. The top 30 genera listed in <xref ref-type="table" rid="T2">Table 2</xref> all had a conjugative genome frequency greater than 20%, with genomes from the genus <italic>Legionella</italic> containing conjugative proteins over 99% of the time. This high percentage may have been driven by sampling bias in the available NCBI WGS datasets (for example, the <italic>Legionella pneumophila</italic> WGS accessions appear to have been collected from a single site), or it may represent the propensity for conjugation-mediated processes to occur within individual genera.</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Proportion of genomes that contained conjugative feature(s), by genus. All genera with over 100 representative genomes are listed, in descending order by the proportion of conjugative genomes in each genus.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Genus</th>
<th align="left">Number of conjugative genomes</th>
<th align="left">Number of total genomes</th>
<th align="left">Proportion conjugative genomes</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">
<italic>Legionella</italic>
</td>
<td align="left">1,672</td>
<td align="left">1,686</td>
<td align="char" char=".">0.99</td>
</tr>
<tr>
<td align="left">
<italic>Shigella</italic>
</td>
<td align="left">5,423</td>
<td align="left">5,541</td>
<td align="char" char=".">0.98</td>
</tr>
<tr>
<td align="left">
<italic>Klebsiella</italic>
</td>
<td align="left">4,682</td>
<td align="left">5,304</td>
<td align="char" char=".">0.88</td>
</tr>
<tr>
<td align="left">
<italic>Elizabethkingia</italic>
</td>
<td align="left">102</td>
<td align="left">119</td>
<td align="char" char=".">0.86</td>
</tr>
<tr>
<td align="left">
<italic>Escherichia</italic>
</td>
<td align="left">8,140</td>
<td align="left">9,957</td>
<td align="char" char=".">0.82</td>
</tr>
<tr>
<td align="left">
<italic>Stenotrophomonas</italic>
</td>
<td align="left">441</td>
<td align="left">563</td>
<td align="char" char=".">0.78</td>
</tr>
<tr>
<td align="left">
<italic>Enterobacter</italic>
</td>
<td align="left">894</td>
<td align="left">1,210</td>
<td align="char" char=".">0.74</td>
</tr>
<tr>
<td align="left">
<italic>Vibrio</italic>
</td>
<td align="left">2,902</td>
<td align="left">4,017</td>
<td align="char" char=".">0.72</td>
</tr>
<tr>
<td align="left">
<italic>Acinetobacter</italic>
</td>
<td align="left">2,621</td>
<td align="left">3,770</td>
<td align="char" char=".">0.70</td>
</tr>
<tr>
<td align="left">
<italic>Pseudomonas</italic>
</td>
<td align="left">3,222</td>
<td align="left">4,750</td>
<td align="char" char=".">0.68</td>
</tr>
<tr>
<td align="left">
<italic>Enterococcus</italic>
</td>
<td align="left">1,003</td>
<td align="left">1,516</td>
<td align="char" char=".">0.66</td>
</tr>
<tr>
<td align="left">
<italic>Citrobacter</italic>
</td>
<td align="left">131</td>
<td align="left">203</td>
<td align="char" char=".">0.65</td>
</tr>
<tr>
<td align="left">
<italic>Salmonella</italic>
</td>
<td align="left">24,123</td>
<td align="left">38,808</td>
<td align="char" char=".">0.62</td>
</tr>
<tr>
<td align="left">
<italic>Clostridioides</italic>
</td>
<td align="left">1,329</td>
<td align="left">2,183</td>
<td align="char" char=".">0.61</td>
</tr>
<tr>
<td align="left">
<italic>Streptococcus</italic>
</td>
<td align="left">8,244</td>
<td align="left">13,766</td>
<td align="char" char=".">0.60</td>
</tr>
<tr>
<td align="left">
<italic>Xanthomonas</italic>
</td>
<td align="left">201</td>
<td align="left">357</td>
<td align="char" char=".">0.56</td>
</tr>
<tr>
<td align="left">
<italic>Staphylococcus</italic>
</td>
<td align="left">18,034</td>
<td align="left">32,661</td>
<td align="char" char=".">0.55</td>
</tr>
<tr>
<td align="left">
<italic>Rhizobium</italic>
</td>
<td align="left">110</td>
<td align="left">202</td>
<td align="char" char=".">0.54</td>
</tr>
<tr>
<td align="left">
<italic>Yersinia</italic>
</td>
<td align="left">215</td>
<td align="left">437</td>
<td align="char" char=".">0.49</td>
</tr>
<tr>
<td align="left">
<italic>Lactococcus</italic>
</td>
<td align="left">57</td>
<td align="left">117</td>
<td align="char" char=".">0.49</td>
</tr>
<tr>
<td align="left">
<italic>Serratia</italic>
</td>
<td align="left">230</td>
<td align="left">619</td>
<td align="char" char=".">0.37</td>
</tr>
<tr>
<td align="left">
<italic>Sinorhizobium</italic>
</td>
<td align="left">44</td>
<td align="left">121</td>
<td align="char" char=".">0.36</td>
</tr>
<tr>
<td align="left">
<italic>Bifidobacterium</italic>
</td>
<td align="left">137</td>
<td align="left">403</td>
<td align="char" char=".">0.34</td>
</tr>
<tr>
<td align="left">
<italic>Moraxella</italic>
</td>
<td align="left">65</td>
<td align="left">192</td>
<td align="char" char=".">0.34</td>
</tr>
<tr>
<td align="left">
<italic>Bacillus</italic>
</td>
<td align="left">471</td>
<td align="left">1,471</td>
<td align="char" char=".">0.32</td>
</tr>
<tr>
<td align="left">
<italic>Campylobacter</italic>
</td>
<td align="left">5,340</td>
<td align="left">19,501</td>
<td align="char" char=".">0.27</td>
</tr>
<tr>
<td align="left">
<italic>Aeromonas</italic>
</td>
<td align="left">80</td>
<td align="left">312</td>
<td align="char" char=".">0.26</td>
</tr>
<tr>
<td align="left">
<italic>Brucella</italic>
</td>
<td align="left">230</td>
<td align="left">970</td>
<td align="char" char=".">0.24</td>
</tr>
<tr>
<td align="left">
<italic>Mesorhizobium</italic>
</td>
<td align="left">89</td>
<td align="left">385</td>
<td align="char" char=".">0.23</td>
</tr>
<tr>
<td align="left">
<italic>Helicobacter</italic>
</td>
<td align="left">118</td>
<td align="left">529</td>
<td align="char" char=".">0.22</td>
</tr>
<tr>
<td align="left">
<italic>Streptomyces</italic>
</td>
<td align="left">74</td>
<td align="left">333</td>
<td align="char" char=".">0.22</td>
</tr>
<tr>
<td align="left">
<italic>Corynebacterium</italic>
</td>
<td align="left">133</td>
<td align="left">639</td>
<td align="char" char=".">0.21</td>
</tr>
<tr>
<td align="left">
<italic>Neisseria</italic>
</td>
<td align="left">153</td>
<td align="left">781</td>
<td align="char" char=".">0.20</td>
</tr>
<tr>
<td align="left">
<italic>Burkholderia</italic>
</td>
<td align="left">341</td>
<td align="left">2,053</td>
<td align="char" char=".">0.17</td>
</tr>
<tr>
<td align="left">
<italic>Haemophilus</italic>
</td>
<td align="left">65</td>
<td align="left">403</td>
<td align="char" char=".">0.16</td>
</tr>
<tr>
<td align="left">
<italic>Lactobacillus</italic>
</td>
<td align="left">144</td>
<td align="left">962</td>
<td align="char" char=".">0.15</td>
</tr>
<tr>
<td align="left">
<italic>Listeria</italic>
</td>
<td align="left">848</td>
<td align="left">7,716</td>
<td align="char" char=".">0.11</td>
</tr>
<tr>
<td align="left">
<italic>Clostridium</italic>
</td>
<td align="left">40</td>
<td align="left">454</td>
<td align="char" char=".">0.09</td>
</tr>
<tr>
<td align="left">
<italic>Mycobacterium</italic>
</td>
<td align="left">1,120</td>
<td align="left">13,129</td>
<td align="char" char=".">0.09</td>
</tr>
<tr>
<td align="left">
<italic>Cutibacterium</italic>
</td>
<td align="left">10</td>
<td align="left">118</td>
<td align="char" char=".">0.08</td>
</tr>
<tr>
<td align="left">
<italic>Bordetella</italic>
</td>
<td align="left">60</td>
<td align="left">733</td>
<td align="char" char=".">0.08</td>
</tr>
<tr>
<td align="left">
<italic>Chlamydia</italic>
</td>
<td align="left">33</td>
<td align="left">496</td>
<td align="char" char=".">0.07</td>
</tr>
<tr>
<td align="left">Bartonella</td>
<td align="left">3</td>
<td align="left">124</td>
<td align="char" char=".">0.02</td>
</tr>
<tr>
<td align="left">
<italic>Mycoplasma</italic>
</td>
<td align="left">2</td>
<td align="left">251</td>
<td align="char" char=".">0.01</td>
</tr>
<tr>
<td align="left">
<italic>Francisella</italic>
</td>
<td align="left">0</td>
<td align="left">120</td>
<td align="char" char=".">0.00</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Next, we identified a total of 5,956 conjugation proteins across genus pairs, i.e., triples of the form (genus1, genus2, protein-name), associated with a total of 23,353,196,048 cargo protein sequences. These results are visualizable as connected nodes in the ggMOB network. This count is non-distinct by protein name as, for instance, Tyrosine recombinase XerD was found both between Salmonella-Salmonella genomes, as well as between Oligella-Proteus genomes and other genera pairs. Of these 5,956 triples, 1,680 contained genome pairs belonging to the same genus (i.e., intra-genus). Some genera were much more likely to contain genomes with conjugative features that matched to genomes from other genera, i.e., inter-genus. For example, we observed over 30 million instances of matching conjugation proteins in genomes from the <italic>Acinetobacter</italic> genus. Of these instances, 84% were to genomes from other genera (i.e., inter-genus), <italic>versus</italic> 16% from genomes within <italic>Acinetobacter</italic> (i.e., intra-genus). Members of the <italic>Acinetobacter</italic> genus are well-known for genome plasticity (<xref ref-type="bibr" rid="B14">Chan et al., 2015</xref>), which contributes to important phenotypes such as AMR and biofilm formation.</p>
<p>Genera that shared the highest number of conjugation proteins with <italic>Acinetobacter</italic> genomes included <italic>Escherichia</italic>, <italic>Shigella</italic>, <italic>Vibrio</italic>, <italic>Salmonella</italic>, <italic>Pseudomonas</italic>, <italic>Klebsiella</italic>, <italic>Enterobacter</italic> and <italic>Citrobacter</italic>. While this result was not unexpected given the list of known pathogens contained within these genera, our database of intra- and inter-genus exact-match conjugative features also revealed many unreported and unexpected associations. For example, genomes within the genus Nitrosomonas contained 38,034 instances of conjugative proteins, nearly 100% of which were shared with genomes from the <italic>Shigella</italic> genus. The specific conjugative feature involved in the vast majority of these exact matches was ICEEc2, a relatively recently discovered ICE MGE that was previously shown to transfer competently between <italic>Salmonella enterica</italic> serovar Typhimurium strain and into a <italic>Yersinia pseudotuberculosis</italic> strain. Our results suggest that ICEEc2 has a very broad host-donor range, including many genera that may not yet be described in the literature in reference to this particular ICE.</p>
<p>We found that the likelihood of identifying conjugative features in pairs of genomes within <italic>versus</italic> across genera was highly variable. Of the 36 conjugative features analyzed, 13 were only identified in pairs of genomes belonging to the same genus, i.e., intra-genus (<xref ref-type="table" rid="T3">Table 3</xref>). However, six conjugative features were more likely to be observed across genera than within genera, i.e., <inline-formula id="inf1">
<mml:math id="m1">
<mml:mo>&#x3e;</mml:mo>
<mml:mn>50</mml:mn>
<mml:mi>%</mml:mi>
</mml:math>
</inline-formula> of the observations were inter-genus (<xref ref-type="table" rid="T3">Table 3</xref>). For example, the exact same CTn341 sequence was observed in pairs of genomes a total of 10,796 times; in 72% of these instances, the pairs of genomes belonged to different genera, indicating a history of inter-genus transfer of CTn341. This conjugative feature belongs to the ICE family of MGEs and plays an important role in tetracycline resistance, and is typically associated with the genus <italic>Bacteroides</italic>, including in most reports related to its functionality (<xref ref-type="bibr" rid="B3">Bacic et al., 2005</xref>). However, we observed that 17% of the genome pairs containing exact-match CTn341 sequences belonged to the <italic>Bacteroides</italic> and Alistipes genera, suggesting historical transfer of this important ICE between these genera. Alistipes is an emerging genus with potential health implications (<xref ref-type="bibr" rid="B46">Parker et al., 2020</xref>), and the epidemiology and ecology of CTn341 within this genus warrants further investigation. Furthermore, this finding provides additional insight into the potential importance of CTn341 in spreading tetracycline resistance genes across microbial taxa.</p>
<table-wrap id="T3" position="float">
<label>TABLE 3</label>
<caption>
<p>Count and proportion of inter- and intra-genus detection of conjugative features.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th colspan="1" align="left">Conjugative</th>
<th colspan="1" align="left">No. Inter-genus</th>
<th colspan="1" align="left">Prop. Inter-genus</th>
<th colspan="1" align="left">No. of intra-genus</th>
<th colspan="1" align="left">Prop. Intra-genus</th>
</tr>
<tr>
<th align="left">Feature</th>
<th align="left">Matches</th>
<th align="left">Matches</th>
<th align="left">Matches</th>
<th align="left">Matches</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">IPR014059</td>
<td align="left">122,066</td>
<td align="left">0.02</td>
<td align="left">6,098,286</td>
<td align="left">0.98</td>
</tr>
<tr>
<td align="left">IPR014862</td>
<td align="left">123,175</td>
<td align="left">0.02</td>
<td align="left">6,246,342</td>
<td align="left">0.98</td>
</tr>
<tr>
<td align="left">IPR005094</td>
<td align="left">415,744</td>
<td align="left">0.11</td>
<td align="left">3,224,556</td>
<td align="left">0.89</td>
</tr>
<tr>
<td align="left">IPR014136</td>
<td align="left">43</td>
<td align="left">0.00</td>
<td align="left">83,448</td>
<td align="left">1.00</td>
</tr>
<tr>
<td align="left">Tn916</td>
<td align="left">110,710,102</td>
<td align="left">0.61</td>
<td align="left">71,585,305</td>
<td align="left">0.39</td>
</tr>
<tr>
<td align="left">GI3</td>
<td align="left">74,775</td>
<td align="left">0.20</td>
<td align="left">304,550</td>
<td align="left">0.80</td>
</tr>
<tr>
<td align="left">ICEPdaSpa1</td>
<td align="left">8,356,908</td>
<td align="left">0.37</td>
<td align="left">14,101,581</td>
<td align="left">0.63</td>
</tr>
<tr>
<td align="left">ICEclc</td>
<td align="left">75,322</td>
<td align="left">0.20</td>
<td align="left">304,722</td>
<td align="left">0.80</td>
</tr>
<tr>
<td align="left">ICEhin1056</td>
<td align="left">128,834,838</td>
<td align="left">0.69</td>
<td align="left">58,590,390</td>
<td align="left">0.31</td>
</tr>
<tr>
<td align="left">IPR011119</td>
<td align="left">454,906</td>
<td align="left">0.03</td>
<td align="left">16,981,338</td>
<td align="left">0.97</td>
</tr>
<tr>
<td align="left">IPR021300</td>
<td align="left">69,832</td>
<td align="left">0.00</td>
<td align="left">20,685,606</td>
<td align="left">1.00</td>
</tr>
<tr>
<td align="left">IPR022303</td>
<td align="left">44,341</td>
<td align="left">0.01</td>
<td align="left">7,859,462</td>
<td align="left">0.99</td>
</tr>
<tr>
<td align="left">IPR022391</td>
<td align="left">52,638</td>
<td align="left">0.00</td>
<td align="left">14,265,248</td>
<td align="left">1.00</td>
</tr>
<tr>
<td align="left">IPR025955</td>
<td align="left">55,3687</td>
<td align="left">0.02</td>
<td align="left">32,073,159</td>
<td align="left">0.98</td>
</tr>
<tr>
<td align="left">SXT</td>
<td align="left">17,427,985</td>
<td align="left">0.58</td>
<td align="left">12,525,984</td>
<td align="left">0.42</td>
</tr>
<tr>
<td align="left">CTn341</td>
<td align="left">7,760</td>
<td align="left">0.72</td>
<td align="left">3,036</td>
<td align="left">0.28</td>
</tr>
<tr>
<td align="left">ICEEc1</td>
<td align="left">1,107,736</td>
<td align="left">0.18</td>
<td align="left">5,010,865</td>
<td align="left">0.82</td>
</tr>
<tr>
<td align="left">ICEEc2</td>
<td align="left">28,902,519</td>
<td align="left">0.33</td>
<td align="left">58,830,977</td>
<td align="left">0.67</td>
</tr>
<tr>
<td align="left">ICEKp1</td>
<td align="left">1,629,343</td>
<td align="left">0.20</td>
<td align="left">6,550,799</td>
<td align="left">0.80</td>
</tr>
<tr>
<td align="left">IPR011952</td>
<td align="left">50</td>
<td align="left">0.00</td>
<td align="left">3,154,129</td>
<td align="left">1.00</td>
</tr>
<tr>
<td align="left">IPR014129</td>
<td align="left">75,786</td>
<td align="left">0.02</td>
<td align="left">4,557,985</td>
<td align="left">0.98</td>
</tr>
<tr>
<td align="left">R391</td>
<td align="left">796,084</td>
<td align="left">0.10</td>
<td align="left">7,476,937</td>
<td align="left">0.90</td>
</tr>
<tr>
<td align="left">Tn4555</td>
<td align="left">972</td>
<td align="left">0.72</td>
<td align="left">382</td>
<td align="left">0.28</td>
</tr>
<tr>
<td align="left">pKLC102</td>
<td align="left">10,135</td>
<td align="left">0.00</td>
<td align="left">5,277,724</td>
<td align="left">1.00</td>
</tr>
<tr>
<td align="left">IPR020369</td>
<td align="left">577</td>
<td align="left">0.12</td>
<td align="left">4,406</td>
<td align="left">0.88</td>
</tr>
<tr>
<td align="left">Tn1549</td>
<td align="left">866</td>
<td align="left">0.04</td>
<td align="left">23,336</td>
<td align="left">0.96</td>
</tr>
<tr>
<td align="left">ICESde3396</td>
<td align="left">7,659</td>
<td align="left">0.00</td>
<td align="left">1,676,016</td>
<td align="left">1.00</td>
</tr>
<tr>
<td align="left">CTnBST</td>
<td align="left">337,318</td>
<td align="left">0.63</td>
<td align="left">196,675</td>
<td align="left">0.37</td>
</tr>
<tr>
<td align="left">ICEBs1</td>
<td align="left">0</td>
<td align="left">0.00</td>
<td align="left">1,220,869</td>
<td align="left">1.00</td>
</tr>
<tr>
<td align="left">ICE6013</td>
<td align="left">46,112</td>
<td align="left">0.00</td>
<td align="left">406,783,868</td>
<td align="left">1.00</td>
</tr>
<tr>
<td align="left">ICESt1</td>
<td align="left">31</td>
<td align="left">0.12</td>
<td align="left">237</td>
<td align="left">0.88</td>
</tr>
<tr>
<td align="left">ICEMISymR7A</td>
<td align="left">0</td>
<td align="left">0.00</td>
<td align="left">37</td>
<td align="left">1.00</td>
</tr>
<tr>
<td align="left">PAPI-1</td>
<td align="left">0</td>
<td align="left">0.00</td>
<td align="left">6,101,539</td>
<td align="left">1.00</td>
</tr>
<tr>
<td align="left">ICESt3</td>
<td align="left">0</td>
<td align="left">0.00</td>
<td align="left">97</td>
<td align="left">1.00</td>
</tr>
<tr>
<td align="left">RD2</td>
<td align="left">0</td>
<td align="left">0.00</td>
<td align="left">1,547,322</td>
<td align="left">1.00</td>
</tr>
<tr>
<td align="left">TnGBS2</td>
<td align="left">0</td>
<td align="left">0.00</td>
<td align="left">56,243</td>
<td align="left">1.00</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s2-3">
<title>2.3 Cargo gene profiles</title>
<p>To characterize the set of genes that are most likely to have been associated with conjugative HGT events, we identified all proteins that were contained in at least two conjugative genomes with 100% sequence identity. Out of 51,362,178 total unique protein sequences in the source database, 28,042 were identified as conjugation-associated proteins (i.e., conjugation machinery), and 11,276,651 were identified as candidate cargo proteins. The full set of cargo proteins mapped to 20,550 distinct names (excluding &#x201c;putative protein(s)&#x201d; or &#x201c;hypothetical protein(s)&#x201d;), with a wide range of frequencies within and between genera. Annotation of the conjugative genomes demonstrated that the vast majority of conjugative and cargo proteins were adjacent within the genome (<xref ref-type="fig" rid="F2">Figure 2</xref>). Moreover, within each genome, the conjugative features were more likely to be proximate to putative cargo protein <italic>versus</italic> non-cargo proteins, suggesting again a common evolutionary history.</p>
</sec>
<sec id="s2-4">
<title>2.4 Genotypic AMR and association with conjugation features</title>
<p>A subset of the observed cargo protein names were associated with a set of confirmed AMR protein names. We identified this subset by selecting only those names that Prokka assigned to sequences mapping to a name defined in MEGARes v1.0 (<xref ref-type="bibr" rid="B30">Lakin et al., 2016</xref>), a comprehensive AMR database. The entity relations in our database ensured a 1:1 mapping between gene and protein names and their respective sequences. Of the 3,824 distinct sequences contained in MEGARes, Prokka identified 3,674 as valid sequences coding for protein. These 3,674 distinct proteins were assigned 286 distinct names, excluding &#x201c;putative protein&#x201d; and &#x201c;hypothetical protein&#x201d;. These unnamed proteins comprised just 1% of the MEGARes protein set. While this highly curated set is certainly not a comprehensive list of all proteins contributing to AMR, it is an initial set to estimate the fraction of AMR proteins within the larger set of conjugation and cargo proteins.</p>
<p>To further investigate the microbial genomics of AMR in relation to HGT events, we used plasmid sequences from NCBI to identify the set of AMR-specific cargo proteins found in a plasmid sequence. We then compared the distribution of AMR proteins in plasmids <italic>versus</italic> conjugative genomes (<xref ref-type="fig" rid="F3">Figure 3</xref>). The distribution of AMR genes differed between plasmids and conjugative genomes, with a high probability that AMR genes were identified in conjugative (<italic>versus</italic> non-conjugative) genomes, and a much lower probability of being identified in plasmids (<xref ref-type="fig" rid="F3">Figure 3</xref>). While plasmids are often critical to the microbial ecology of AMR, this analysis suggests that other conjugative processes may drive the vast majority of AMR gene exchanges between bacteria. This dynamic has been reported for specific AMR gene groups, including carbapenem AMR genes (<xref ref-type="bibr" rid="B10">Botelho et al., 2020</xref>), and also supports previous analyses of conjugative machinery across bacterial genera (<xref ref-type="bibr" rid="B25">Guglielmini et al., 2011</xref>).</p>
<p>To analyze the distribution of AMR proteins across genomes, we calculated the probability that each AMR gene was identified in conjugative <italic>versus</italic> non-conjugative genomes (<xref ref-type="table" rid="T4">Table 4</xref>). From the complete list of 286 AMR protein names, 220 were found more often in conjugative genomes; three were found with equal probability in conjugative and non-conjugative genomes; and 63 were found more often in genomes that did not contain any conjugation proteins. Given that the proportion of conjugative genomes in our database was 51%, these results suggest that AMR genes are disproportionately represented within conjugative genomes.</p>
<table-wrap id="T4" position="float">
<label>TABLE 4</label>
<caption>
<p>Probability of observing AMR proteins in genomes that also contained conjugative features.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">AMR protein name</th>
<th align="left">Number of Genomes</th>
<th align="left">Number of Conjugative Genomes</th>
<th align="left">Proportion Conjugative Genomes</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Rob DNA-binding transcriptional activator</td>
<td align="left">4,559</td>
<td align="left">4,559</td>
<td align="char" char=".">1.00</td>
</tr>
<tr>
<td align="left">Transposon Tn10 TetD protein</td>
<td align="left">4,559</td>
<td align="left">4,559</td>
<td align="char" char=".">1.00</td>
</tr>
<tr>
<td align="left">Tetracycline resistance gene Tet(M)</td>
<td align="left">441</td>
<td align="left">441</td>
<td align="char" char=".">1.00</td>
</tr>
<tr>
<td align="left">Outer membrane protein YedS</td>
<td align="left">288</td>
<td align="left">288</td>
<td align="char" char=".">1.00</td>
</tr>
<tr>
<td align="left">Regulator of RpoS</td>
<td align="left">288</td>
<td align="left">288</td>
<td align="char" char=".">1.00</td>
</tr>
<tr>
<td align="left">Beta-lactamase Toho-1</td>
<td align="left">319</td>
<td align="left">318</td>
<td align="char" char=".">1.00</td>
</tr>
<tr>
<td align="left">AcrAD-TolC permease subunit</td>
<td align="left">1,584</td>
<td align="left">1,576</td>
<td align="char" char=".">0.99</td>
</tr>
<tr>
<td align="left">Multidrug efflux pump subunit AcrB</td>
<td align="left">1,584</td>
<td align="left">1,576</td>
<td align="char" char=".">0.99</td>
</tr>
<tr>
<td align="left">DNA topoisomerase subunit A</td>
<td align="left">1,091</td>
<td align="left">1,085</td>
<td align="char" char=".">0.99</td>
</tr>
<tr>
<td align="left">MATE family multidrug efflux pump protein</td>
<td align="left">1,607</td>
<td align="left">1,596</td>
<td align="char" char=".">0.99</td>
</tr>
<tr>
<td align="left">Carbapenem-hydrolyzing beta-lactamase KPC</td>
<td align="left">1,914</td>
<td align="left">1,899</td>
<td align="char" char=".">0.99</td>
</tr>
<tr>
<td align="left">Beta-lactamase OXA-1</td>
<td align="left">1,188</td>
<td align="left">1,175</td>
<td align="char" char=".">0.99</td>
</tr>
<tr>
<td align="left">Inner membrane protein HsrA</td>
<td align="left">350</td>
<td align="left">346</td>
<td align="char" char=".">0.99</td>
</tr>
<tr>
<td align="left">Putative transport protein YdhC</td>
<td align="left">342</td>
<td align="left">338</td>
<td align="char" char=".">0.99</td>
</tr>
<tr>
<td align="left">Aclacinomycin methylesterase RdmC</td>
<td align="left">419</td>
<td align="left">414</td>
<td align="char" char=".">0.99</td>
</tr>
<tr>
<td align="left">Beta-lactamase OXA-2</td>
<td align="left">199</td>
<td align="left">196</td>
<td align="char" char=".">0.98</td>
</tr>
<tr>
<td align="left">Chloramphenicol efflux MFS transporter CmlA1</td>
<td align="left">795</td>
<td align="left">783</td>
<td align="char" char=".">0.98</td>
</tr>
<tr>
<td align="left">Beta-lactamase OXA-10</td>
<td align="left">521</td>
<td align="left">513</td>
<td align="char" char=".">0.98</td>
</tr>
<tr>
<td align="left">armA&#x2a;</td>
<td align="left">994</td>
<td align="left">978</td>
<td align="char" char=".">0.98</td>
</tr>
<tr>
<td align="left">rRNA large subunit methyltransferase H</td>
<td align="left">4,087</td>
<td align="left">3,989</td>
<td align="char" char=".">0.98</td>
</tr>
<tr>
<td align="left">Multidrug resistance operon repressor</td>
<td align="left">486</td>
<td align="left">67</td>
<td align="char" char=".">0.14</td>
</tr>
<tr>
<td align="left">Outer membrane protein OprM</td>
<td align="left">478</td>
<td align="left">65</td>
<td align="char" char=".">0.14</td>
</tr>
<tr>
<td align="left">Methicillin-resistance regulatory protein MecR1</td>
<td align="left">8,344</td>
<td align="left">1,007</td>
<td align="char" char=".">0.12</td>
</tr>
<tr>
<td align="left">Phosphoethanolamine-lipid A transferase</td>
<td align="left">8,344</td>
<td align="left">1,007</td>
<td align="char" char=".">0.12</td>
</tr>
<tr>
<td align="left">HTH-type transcriptional repressor BepR</td>
<td align="left">467</td>
<td align="left">55</td>
<td align="char" char=".">0.12</td>
</tr>
<tr>
<td align="left">Bifunctional polymyxin resistance protein ArnA</td>
<td align="left">507</td>
<td align="left">53</td>
<td align="char" char=".">0.10</td>
</tr>
<tr>
<td align="left">Methicillin resistance regulatory protein MecI</td>
<td align="left">6,583</td>
<td align="left">395</td>
<td align="char" char=".">0.06</td>
</tr>
<tr>
<td align="left">Metallothiol transferase FosB</td>
<td align="left">6,584</td>
<td align="left">395</td>
<td align="char" char=".">0.06</td>
</tr>
<tr>
<td align="left">Multidrug efflux transporter MdtL</td>
<td align="left">419</td>
<td align="left">9</td>
<td align="char" char=".">0.02</td>
</tr>
<tr>
<td align="left">Multidrug efflux pump subunit AcrA</td>
<td align="left">420</td>
<td align="left">7</td>
<td align="char" char=".">0.02</td>
</tr>
<tr>
<td align="left">HTH-type transcriptional regulator SyrM 1</td>
<td align="left">414</td>
<td align="left">3</td>
<td align="char" char=".">0.01</td>
</tr>
<tr>
<td align="left">RND transporter permease subunit OqxB3</td>
<td align="left">358</td>
<td align="left">2</td>
<td align="char" char=".">0.01</td>
</tr>
<tr>
<td align="left">Aminoglycoside 2&#x2032;-N-acetyltransferase</td>
<td align="left">9,723</td>
<td align="left">5</td>
<td align="char" char=".">0.00</td>
</tr>
<tr>
<td align="left">DNA-binding response regulator MtrA</td>
<td align="left">9,854</td>
<td align="left">2</td>
<td align="char" char=".">0.00</td>
</tr>
<tr>
<td align="left">Putative acetyltransferase</td>
<td align="left">5,232</td>
<td align="left">1</td>
<td align="char" char=".">0.00</td>
</tr>
<tr>
<td align="left">Quinolone resistance protein NorB</td>
<td align="left">213</td>
<td align="left">0</td>
<td align="char" char=".">0.00</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>Only AMR proteins that appeared in more than 100 genomes were considered; and only AMR proteins that occurred in conjugative genomes with a probability <inline-formula id="inf2">
<mml:math id="m2">
<mml:mo>&#x2265;</mml:mo>
<mml:mn>0.98</mml:mn>
</mml:math>
</inline-formula> or <inline-formula id="inf3">
<mml:math id="m3">
<mml:mo>&#x2264;</mml:mo>
<mml:mn>0.15</mml:mn>
</mml:math>
</inline-formula> are listed in this table. Full data available in the <xref ref-type="sec" rid="s9">Supplementary Table S3</xref>. &#x2a;Full protein name: 16S rRNA (guanine(1405)-N(7))-methyltransferase.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>The above analysis does not distinguish between different types of conjugation features, and also treats AMR proteins as independent features. However, the data in <xref ref-type="fig" rid="F2">Figure 2</xref> demonstrate that many of the conjugation features defined in <xref ref-type="table" rid="T1">Table 1</xref> often co-occur in the same genome, as do some of the AMR proteins. To gain insight into these correlations, and to identify groups of AMR proteins associated with different conjugation families, we performed a genomic co-occurrence analysis across all conjugation features for the 138 AMR proteins found in conjugative genomes with a frequency of at least 5 times compared to identification in non-conjugative genomes (i.e., these AMR proteins were highly represented in conjugative genomes, <xref ref-type="fig" rid="F4">Figure 4</xref>). The results of this analysis demonstrated that some conjugation features frequently co-occurred within genomes with both other conjugation features as well as multiple AMR proteins. For example, IPR005094 co-occurred with the highest diversity of AMR protein names (N &#x3d; 139, see <xref ref-type="sec" rid="s9">Supplementary Table S2</xref>). Many co-occurrence patterns reflected known biological associations. For example, the Tn916 conjugation feature co-occurred most frequently with tetracycline ribosomal protection protein TetM, a genomic association discovered over 3&#xa0;decades ago (<xref ref-type="bibr" rid="B68">Su et al., 1992</xref>). While TetM seemed to co-occur with a few select conjugation features (such as Tn916), other AMR protein names co-occurred with many conjugation features. For example, many of the AMR names associated with extended-spectrum beta-lactam and carbapenem resistance (e.g., beta-lactamases Toho-1, OXA-1, OXa-2, OXA-10, SHV-2, and KPC) co-occured with the majority of evaluated conjugation features, which may provide partial explanation for the observed rapid expansion of these important AMR genes within Enterobacteriaceae (<xref ref-type="bibr" rid="B33">Logan and Weinstein, 2017</xref>). Similarly, the recently widely-publicized mcr-1 protein co-occurred with multiple conjugation features, which both strengthens and expands upon recent findings that this AMR gene has been mobilized on numerous plasmid types (<xref ref-type="bibr" rid="B72">Wang et al., 2018</xref>). Co-occurrence data such as those provided in <xref ref-type="fig" rid="F4">Figure 4</xref> may represent a new and sustainable (i.e., easily updated) source of information regarding the potential for new and emerging AMR genes to expand within and across bacterial populations <italic>via</italic> HGT. This information, in turn, could help to prioritize and focus public health and human clinical decision-making regarding AMR.</p>
<p>Conversely, 29 AMR proteins occurred at least 5x more frequently in non-conjugative genomes compared to conjugative genomes (<xref ref-type="sec" rid="s9">Supplementary Figure S1</xref>). Of note is the observation that no beta-lactam AMR protein names occur in this list of 29 AMR names, which contrasts starkly to the preponderance of beta-lactam-associated AMR names in <xref ref-type="fig" rid="F4">Figure 4</xref>, again suggesting that beta-lactam resistance is tightly coupled with conjugative machinery, and that conjugation-mediated exchange is the primary evolutionary driver of beta-lactam resistance. By comparison, several mechanisms of multi-drug resistance (MDR) are contained within the list of 29 AMR proteins observed more frequently in non-conjugative <italic>versus</italic> conjugative genomes, i.e., AcrB, AcrE, OqxB7, mdtA, mdtE, mdtH, and MexB. These mechanisms of MDR tend to be multi-function, i.e., the proteins confer multiple functional benefits to bacteria, in addition to AMR. Together, the results of <xref ref-type="fig" rid="F4">Figure 4</xref> and <xref ref-type="sec" rid="s9">Supplementary Figure S1</xref> suggest that proteins with more specific AMR functions tend to be disproportionately represented amongst conjugative genomes, while more generalist proteins tend to be disproportionately represented within non-conjugative genomes. One hypothesis for this observation is that the fitness cost-benefit dynamics differ for generalist <italic>versus</italic> specialist genes, such that specialized genes are more likely to transiently yet rapidly spread within bacterial populations <italic>via</italic> the so-called &#x2018;accessory genome&#x2019; (which includes conjugation-mediated exchange), whereas generalist genes are more likely to be maintained permanently within bacterial genomes, and thus are less likely to be identified as conjugation-associated cargo.</p>
</sec>
<sec id="s2-5">
<title>2.5 Phenotypic AMR and association with conjugative genomes</title>
<p>Given our hypothesis that conjugation-mediated spread of specialized AMR genes may be promoted by more specific evolutionary pressures such as antimicrobial drug exposures, we hypothesized that this signature of selective pressure may also manifest in the phenotypic properties of conjugative <italic>versus</italic> non-conjugative genomes. To evaluate this, we queried the NCBI BioSample assay metadata in our relational database, to identify isolates that had been subjected to phenotypic antibiotic susceptibility testing (AST) to known antibiotic compounds. For the 186,887 highest quality genomes, the NCBI assay metadata contained 15,286 phenotypically-confirmed resistant genome-compound AST results, representing 13,076 tests for conjugative genomes and 2,210 tests for non-conjugative genomes. Altogether, 1,242 genomes were used in these tests, of which 1,023 were conjugative genomes and 219 were non-conjugative genomes. For each antibiotic compound listed in the AST results, we computed the number of phenotypically resistant isolates with conjugative-vs. non-conjugative genomes.</p>
<p>The results of this analysis revealed that phenotypic resistance occurred in conjugative genomes with probability &#x3e;80%, regardless of compound being tested (<xref ref-type="table" rid="T5">Table 5</xref> and <xref ref-type="sec" rid="s9">Supplementary Table S3</xref>). As with the disproportionate representation of AMR proteins within conjugative genomes, the phenotypic AMR data suggest that microbial AMR dynamics are driven largely by conjugation-mediated processes. However, it is also important to note that NCBI phenotypic assay data is likely biased due to the motivations for clinicians and researchers to submit isolates for phenotypic testing. Therefore, to test for SRA sampling bias with respect to these compounds, we also measured the phenotypically-resistant fraction expected for <italic>randomly selected</italic> genomes, based on the number of genomes tested per compound in <xref ref-type="table" rid="T5">Table 5</xref> and the number of conjugative and non-conjugative genomes across the entire database. This null hypothesis was tested by running 100 bootstrapped trials for each compound (<xref ref-type="table" rid="T3">Table 3</xref>). The observed average probability that phenotypic AMR was expressed by an isolate with a conjugative genome was 0.85 &#xb1; 0.05 <italic>independent of antibiotic compound</italic>, i.e., weighted by total genomes tested per compound (<xref ref-type="table" rid="T5">Table 5</xref>). In a random process, the probability would be expected to be near 51% given the fraction of all genomes with conjugation features. These results further support the importance of conjugation in the microbial ecology and epidemiology of both genotypic and phenotypic AMR.</p>
<table-wrap id="T5" position="float">
<label>TABLE 5</label>
<caption>
<p>Associations between phenotypic AMR and representation of conjugative <italic>versus</italic> non-conjugative genomes.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Antibiotic</th>
<th align="left">Number of Resistant Genomes</th>
<th align="left">Number of Resistant Conjugative Genomes</th>
<th align="left">Expected Number of Resistant Conjugative Genomes<sup>&#x2a;</sup>
</th>
<th align="left">Observed Proportion Conjugative Genomes</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">doripenem</td>
<td align="char" char=".">215</td>
<td align="char" char=".">207</td>
<td align="char" char="plusmn">86 &#xb1; 7</td>
<td align="char" char=".">0.96</td>
</tr>
<tr>
<td align="left">cefepime</td>
<td align="char" char=".">272</td>
<td align="char" char=".">259</td>
<td align="char" char="plusmn">108 &#xb1; 8</td>
<td align="char" char=".">0.95</td>
</tr>
<tr>
<td align="left">ampicillin-sulbactam</td>
<td align="char" char=".">433</td>
<td align="char" char=".">402</td>
<td align="char" char="plusmn">173 &#xb1; 10</td>
<td align="char" char=".">0.93</td>
</tr>
<tr>
<td align="left">imipenem</td>
<td align="char" char=".">429</td>
<td align="char" char=".">396</td>
<td align="char" char="plusmn">171 &#xb1; 11</td>
<td align="char" char=".">0.92</td>
</tr>
<tr>
<td align="left">piperacillin-tazobactam</td>
<td align="char" char=".">280</td>
<td align="char" char=".">258</td>
<td align="char" char="plusmn">112 &#xb1; 9</td>
<td align="char" char=".">0.92</td>
</tr>
<tr>
<td align="left">meropenem</td>
<td align="char" char=".">402</td>
<td align="char" char=".">367</td>
<td align="char" char="plusmn">161 &#xb1; 11</td>
<td align="char" char=".">0.91</td>
</tr>
<tr>
<td align="left">trimethoprim-sulfamethoxazole</td>
<td align="char" char=".">868</td>
<td align="char" char=".">775</td>
<td align="char" char="plusmn">348 &#xb1; 14</td>
<td align="char" char=".">0.89</td>
</tr>
<tr>
<td align="left">ertapenem</td>
<td align="char" char=".">222</td>
<td align="char" char=".">197</td>
<td align="char" char="plusmn">89 &#xb1; 8</td>
<td align="char" char=".">0.89</td>
</tr>
<tr>
<td align="left">levofloxacin</td>
<td align="char" char=".">741</td>
<td align="char" char=".">644</td>
<td align="char" char="plusmn">297 &#xb1; 14</td>
<td align="char" char=".">0.87</td>
</tr>
<tr>
<td align="left">gentamicin</td>
<td align="char" char=".">813</td>
<td align="char" char=".">706</td>
<td align="char" char="plusmn">325 &#xb1; 13</td>
<td align="char" char=".">0.87</td>
</tr>
<tr>
<td align="left">ciprofloxacin</td>
<td align="char" char=".">915</td>
<td align="char" char=".">794</td>
<td align="char" char="plusmn">367 &#xb1; 14</td>
<td align="char" char=".">0.87</td>
</tr>
<tr>
<td align="left">amoxicillin-clavulanic acid</td>
<td align="char" char=".">277</td>
<td align="char" char=".">240</td>
<td align="char" char="plusmn">111 &#xb1; 8</td>
<td align="char" char=".">0.87</td>
</tr>
<tr>
<td align="left">ceftriaxone</td>
<td align="char" char=".">984</td>
<td align="char" char=".">849</td>
<td align="char" char="plusmn">394 &#xb1; 16</td>
<td align="char" char=".">0.86</td>
</tr>
<tr>
<td align="left">tetracycline</td>
<td align="char" char=".">700</td>
<td align="char" char=".">603</td>
<td align="char" char="plusmn">281 &#xb1; 12</td>
<td align="char" char=".">0.86</td>
</tr>
<tr>
<td align="left">ceftazidime</td>
<td align="char" char=".">852</td>
<td align="char" char=".">731</td>
<td align="char" char="plusmn">342 &#xb1; 14</td>
<td align="char" char=".">0.86</td>
</tr>
<tr>
<td align="left">cefotaxime</td>
<td align="char" char=".">889</td>
<td align="char" char=".">758</td>
<td align="char" char="plusmn">355 &#xb1; 15</td>
<td align="char" char=".">0.85</td>
</tr>
<tr>
<td align="left">tobramycin</td>
<td align="char" char=".">674</td>
<td align="char" char=".">574</td>
<td align="char" char="plusmn">270 &#xb1; 12</td>
<td align="char" char=".">0.85</td>
</tr>
<tr>
<td align="left">ampicillin</td>
<td align="char" char=".">1042</td>
<td align="char" char=".">852</td>
<td align="char" char="plusmn">418 &#xb1; 16</td>
<td align="char" char=".">0.82</td>
</tr>
<tr>
<td align="left">amikacin</td>
<td align="char" char=".">383</td>
<td align="char" char=".">313</td>
<td align="char" char="plusmn">154 &#xb1; 10</td>
<td align="char" char=".">0.82</td>
</tr>
<tr>
<td align="left">aztreonam</td>
<td align="char" char=".">989</td>
<td align="char" char=".">805</td>
<td align="char" char="plusmn">397 &#xb1; 15</td>
<td align="char" char=".">0.81</td>
</tr>
<tr>
<td align="left">cefazolin</td>
<td align="char" char=".">1002</td>
<td align="char" char=".">813</td>
<td align="char" char="plusmn">402 &#xb1; 16</td>
<td align="char" char=".">0.81</td>
</tr>
<tr>
<td align="left">cefoxitin</td>
<td align="char" char=".">757</td>
<td align="char" char=".">608</td>
<td align="char" char="plusmn">304 &#xb1; 15</td>
<td align="char" char=".">0.8</td>
</tr>
<tr>
<td align="left">nitrofurantoin</td>
<td align="char" char=".">713</td>
<td align="char" char=".">559</td>
<td align="char" char="plusmn">287 &#xb1; 12</td>
<td align="char" char=".">0.78</td>
</tr>
<tr>
<td align="left">cefotetan</td>
<td align="char" char=".">124</td>
<td align="char" char=".">95</td>
<td align="char" char="plusmn">49 &#xb1; 6</td>
<td align="char" char=".">0.77</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>
<sup>&#x2a;</sup>Only drug compounds with 100 or more non-redundant resistant genome measurements and &#x3e;76% representation in conjugative genomes are listed. The expected number of conjugative genomes was estimated based on a bootstrapped random selection process with 100 trials (null hypothesis), using the number of assays and the actual fraction of genomes with conjugative features (&#x2dc;51%).</p>
</fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="s2-6">
<title>2.6 Genome clustering by conjugative feature profile</title>
<p>The specific proteins transferred between bacteria are known to vary by conjugation feature, for example as demonstrated by the co-occurrence patterns of conjugation features and AMR proteins within genomes (<xref ref-type="fig" rid="F4">Figure 4</xref> and <xref ref-type="sec" rid="s9">Supplementary Figure S1</xref>). To demonstrate the structuring of bacterial populations by conjugation-cargo co-occurrence patterns, we generated the same co-occurrence matrix for all cargo proteins and all conjugative features within genomes that contained a high frequency of cargo proteins (<xref ref-type="fig" rid="F5">Figure 5</xref>). We then calculated the genome-genome Euclidean distance for all genomes in the co-occurrence matrix, using a vector of normalized conjugation features (see <italic>Methods</italic>, <xref ref-type="sec" rid="s9">Supplementary Figure S2</xref>). The results demonstrate clusters of genomes with similar conjugative features. While these clusters often reflect classical bacterial taxonomic structure, there are also instances of discordance between the clustering based on conjugation profile and traditional grouping based on taxonomy. These results reflect the evolutionary dynamics of bacterial populations, and suggest that the relative importance of vertical <italic>versus</italic> horizontal gene transfer events is highly variable. Such variability in the importance of HGT events has been previously reported, including differences in plasmid <italic>versus</italic> ICE-mediated exchange and interactions with bacterial host range (<xref ref-type="bibr" rid="B17">Cury et al., 2018</xref>). This finding has far-reaching and complex implications for applications that rely on a measure of phylogenetic relatedness, i.e., outbreak detection and source attribution. In some cases the use of the core genome may be sufficient to accurately reflect bacterial phylogenetic relatedness; while in others, the information in the core genome may obfuscate the true relationships between bacterial isolates. As WGS data become more widely used, these complexities must be considered, and in some cases, incorporated into phylogenetic analysis workflows.</p>
<p>The relational database underlying this work and the ggMOB tool is a necessary (yet not sufficient) component of improved interpretation and use of WGS data. We note that, in principle, one can use the co-occurrence matrix and vectorization procedure on genomic properties other than conjugative features. This provides a flexible and customizable approach for defining a different set of genomes of interest within the <italic>mobilome</italic>, which can then be used to (re)classify organisms not by name, but by genome-genome distance in a space of mobilization features. This capability could represent a powerful tool for improving our understanding of bacterial evolution while also informing the next generation of applied WGS computational and statistical pipelines.</p>
</sec>
</sec>
<sec sec-type="discussion" id="s3">
<title>3 Discussion</title>
<p>The public availability of large scale genomic data makes it possible to apply cloud computing technology and big data techniques to study important phenomena in molecular and microbiology. Curating these data in a relational database with biologically structured entity relations (i.e., linking genomes, genes, proteins, domains, and metadata) provides a powerful method with which to ask biological questions about the data. We leveraged this approach in the current study of cargo and conjugation, which is an essential mechanism by which bacteria acquire new phenotypes, transmit molecular functions, and adapt to stress. Furthermore, these events are critical for understanding bacterial evolution and phylogeny (<xref ref-type="bibr" rid="B25">Guglielmini et al., 2011</xref>; <xref ref-type="bibr" rid="B1">Abby et al., 2012</xref>; <xref ref-type="bibr" rid="B6">Bellanger et al., 2014</xref>). Our work not only sheds light on conjugation-mediated cargo transfers between and within genera, but also demonstrates the ability of mining and analyzing large datasets in improving our understanding of bacterial evolutionary dynamics. The network of putative genus-genus conjugation features and candidate cargo genes can be dynamically visualized using the ggMOB tool, which supports hypothesis generation and testing related to intra- and inter-genus conjugation dynamics.</p>
<p>In our analysis we identified sets of proteins with the strongest evidence as conjugation and cargo proteins. This was accomplished by selecting only those proteins that exhibited both 100% sequence identity and co-occurrence in pairs of genomes containing identical conjugation-associated sequences. With this strict selection process, the putative cargo proteins exhibited a high degree of spatial correlation within assembled contigs (i.e., they were highly adjacent to each other, as well as to the conjugation protein itself). Other proteins in these genomes may also have been transferred (or are transferable) by bacterial conjugation, but they did not meet our strict selection criteria. Considering only strictly-selected candidate cargo proteins, we were able to profile the frequency of conjugation-mediated protein exchange within and between genera.</p>
<p>Our results suggest that conjugation-mediated exchange is not uncommon, affirming prior studies (<xref ref-type="bibr" rid="B25">Guglielmini et al., 2011</xref>; <xref ref-type="bibr" rid="B6">Bellanger et al., 2014</xref>). Conjugation-related proteins were observable in 51% of bacterial genomes and in 631 of 1,345 genera (approximately 47%). Frequency of intra- and inter-genus conjugation-mediated exchange varied significantly depending on the taxa involved, suggesting that taxonomy greatly influences genetic exchange of, e.g., AMR or pathogenicity proteins (<xref ref-type="bibr" rid="B19">Delavat et al., 2017</xref>). By quantifying this across a large database of high-quality WGS data, we measured the &#x201c;exchange likelihood&#x201d; between different genera. These likelihoods can be visualized dynamically in the ggMOB tool, which reveals distinct clusters of genera that share conjugative features with exact sequence match. This suggests that the likelihood of protein transfer varies substantially by genus pair, and that the bacterial composition within a given environment is an important consideration when attempting to evaluate mobilization potential within a microbial community (<xref ref-type="bibr" rid="B34">Lopatkin and Collin, 2020</xref>; <xref ref-type="bibr" rid="B56">Neil and Allard, 2021</xref>).</p>
<p>While we have conducted this analysis for a specific set of conjugation features (<xref ref-type="table" rid="T1">Table 1</xref>), the analytic approach can be applied to any MGE(s) and cargo protein(s) of interest. As such, our overall approach represents a method for obtaining a long-range evolutionary view of transfer likelihood between diverse bacterial taxa, including pathogens and commensal bacteria (<xref ref-type="bibr" rid="B25">Guglielmini et al., 2011</xref>). These baseline exchange likelihoods are critical parameters for risk analysis at the microbial community level, including for applications such as personalized microbiome medicine, and microbiome-centric surveillance.</p>
<p>Bacterial taxon is not the only significant driver of exchange likelihood; we also observed that putative, successful transfer events were more likely to involve cargo proteins that infer fitness advantage to the involved bacterial populations, such as AMR. While any gene can, in principle, be transmitted as a cargo gene in conjugative exchange, only a subset of transferred proteins will increase the fitness of the receiving organism. The likelihood of observing successful transfer depends on a large number of factors including the environment, the existing proteins in the recipient chromosome, the cargo proteins themselves, and the survival probability of the organism (<xref ref-type="bibr" rid="B16">Cohen et al., 2010</xref>).</p>
<p>Conjugation-mediated protein transfer that improves fitness may increase survival probability. Therefore, chromosomal arrangements that group <italic>fitness-conferring</italic> cargo proteins near the conjugation machinery will be observed more frequently than those arrangements that involve neutral or disadvantageous proteins. Conversely, very common proteins that aid in stress response may be less likely to be transferred as cargo, since the relative fitness advantage is diminished for proteins that are already likely to be present within a bacterium (i.e., proteins that confer redundant function). The particular stressor&#x2014;as well as the specific advantageous proteins of interest&#x2014;depend on phenotype of interest. This view is exemplified by the data in <xref ref-type="table" rid="T4">Table 4</xref> which shows that rare AMR proteins are more likely to be found as cargo in genomes that also contain conjugative proteins, as compared to genomes that do not. Conversely, common AMR proteins are less likely to be found in genomes that contain conjugative machinery. One might hypothesize that, with chromosomal rearrangement, nature effects a real world experiment to dynamically optimize cargo protein collections&#x2014;thereby spreading rare (but useful) proteins and gene combinations over time.</p>
<p>The particular cargo proteins shared between chromosomes varied by conjugation feature, as demonstrated by the AMR proteins analyzed in <xref ref-type="fig" rid="F1">Figures 1</xref>, <xref ref-type="fig" rid="F4">4</xref>. Considering all conjugation features used in this study, our results suggest that conjugation dynamics are important in structuring genomic content, and thus driving phylogenetic evolution. Based on <xref ref-type="fig" rid="F5">Figure 5</xref>, it seems that sometimes these evolutionary conjugation dynamics can sometimes overpower other taxonomic drivers, such that genus-level genomes do not always cluster together. To demonstrate this conjugation-driven phylogeny, we used the data in <xref ref-type="fig" rid="F5">Figure 5</xref> to generate <xref ref-type="fig" rid="F2">Figure 2</xref>, which represents the distance between all pairs of genomes based on Euclidean distance between their representations as normalized conjugation feature vectors. The resulting hierarchical clustering shows that the dominant conjugation features are represented in genomes across different genera and, conversely, that individual genera include genomes with differing conjugation profiles. This abrogation of genus-level taxonomy due to conjugation-related genomic content is an inevitable consequence of the inter-genus transfers visualized in ggMOB. Given the reality of conjugative exchange, there is no reason to expect that taxonomic classification by organism name will always predict the composition of conjugation-associated cargo proteins. However, by selecting genomes based on a particular phenotype of interest, it is possible to classify organisms and genome-genome distances based on a feature space defined by conjugation (or other mobilization) proteins, as in <xref ref-type="fig" rid="F2">Figure 2</xref>. Given the ubiquity and diversity of conjugation and other types of HGT (<xref ref-type="bibr" rid="B25">Guglielmini et al., 2011</xref>), these types of genome clustering techniques may provide crucial information about bacterial evolution that is not contained within traditional phylogenies. In this regard, the ability to filter the ggMOB data based on conjugation features of interest may particularly useful.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Individual genomes typically contained more than one conjugative feature (<xref ref-type="table" rid="T1">Table 1</xref>), and often contained more than one protein per feature. <bold>(A)</bold> Histogram (log frequency) of the number of conjugative features per genome, and <bold>(B)</bold> Histogram (log frequency) of the number of conjugative proteins per genome for all 106,433 genomes containing at least one conjugative feature.</p>
</caption>
<graphic xlink:href="fgene-13-1024577-g001.tif"/>
</fig>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Heatmap showing the relative genomic positions of conjugative features and putative cargo proteins for the 2,000 genomes with the greatest number of cargo proteins. Conjugative features are represented as color pixels based on the colors shown in <xref ref-type="table" rid="T1">Table 1</xref>, with yellow representing proteins assigned specific IPR codes and red representing protein families from the literature. Cargo proteins are shown in grey and other chromosomal DNA in white. Each genome is bit shifted to the left until the first conjugative feature is centered in the figure. Most genomes contained more than one conjugative protein (all contain at least one). The inset highlights the genomes at indices 1450&#x2013;1550 in order to expand a subset of the data.</p>
</caption>
<graphic xlink:href="fgene-13-1024577-g002.tif"/>
</fig>
</sec>
<sec sec-type="materials|methods" id="s4">
<title>4 Materials and methods</title>
<sec id="s4-1">
<title>4.1 Creation of relational database</title>
<p>Here we briefly describe the process used to create the relational database that underlies ggMOB; further details can be found at (<xref ref-type="bibr" rid="B58">Seabolt et al., 2020</xref>). First, we downloaded whole genome sequences from NCBI&#x2019;s Reference Sequence Database (RefSeq), which we then filtered to only obtain genomes that were identified as being of bacterial lineage, and as having an assembly level of &#x201c;Complete Genome&#x201d;. We added to this set of genomes non-assembled sequence data from NCBI&#x2019;s Short Read Archive (SRA) by first downloading all datasets that had the following criteria: (1) the data consisted of WGS data generated from bacteria, as defined according to their taxonomic lineage; (2) the data were Illumina short-read sequence data from DNA; and (3) the sequence data were paired-end. Long-read and transcriptomic data were not considered. We note that we downloadeded all the SRA data in FASTQ format using the SRA toolkit (<xref ref-type="bibr" rid="B69">Sugawara and Shumway, 2010</xref>), and assembled them into contigs using SPAdes (<xref ref-type="bibr" rid="B4">Bankevich et al., 2012</xref>). We discarded any genome assemblies that contained more than 150 contigs (of size &#x3e;500 bp) or had an N50 of less than 100 kbp. We note that only 48% of bacterial genomes met the aforementioned curation thresholds from the original corpus of SRA datasets. Next, we eliminated any assembled genomes in which a significant proportion of <italic>k</italic>-mers originated from multiple genomes across different genera. This removed another 13,044 genomes from consideration. This last step ensured all the genomes used for analysis were from a pure single bacterial isolate with valid genus-level classification, hence minimizing the probability of contamination. We obtained a total of 159,628 genome assemblies after filtering for all the above criteria, and a total of 186,887 genomes when including the genome assemblies from RefSeq.</p>
<p>Next, we annotated all the genomes using Prokka 1.12 (<xref ref-type="bibr" rid="B50">Prokka, 2014</xref>), resulting in the collation of the genome, gene, and protein data entities into CSV files. After annotation, we determined the protein domains using InterProScan 5.28&#x2013;67.0 (<xref ref-type="bibr" rid="B52">Quevillon et al., 2005</xref>) with all available analyses provided by InterProScan (16). This resulted in 16 JSON files that were then parsed to create a set of CSV files. The annotation process yielded a total of 66,945,714 unique gene sequences; 51,362,178 unique protein sequences; and 138,327,556 unique protein domains along with related functional annotations.</p>
<p>Using the curated data, we created a relational database using IBM&#x2019;s DB2 system, which contained the following five different entity types: genomes, genes, proteins, protein domains, and functional annotations. These entities were determined by the above data curation, assembly and annotation steps; each entity in the database was stored using the MD5 hash of the sequence itself to create a unique identifier. Thus, we can quickly query for an entity within the database using the unique identifiers as a key. We stored the relations between entities as tables in the relational database, e.g., the genes corresponding to a particular genome in a table. We note this saves storage because unique sequences are stored only once in their respective tables and the tables point to all the parent entities in which they are found. Thus, while database construction required 1468 CPUs, 6TB RAM, and 160&#xa0;TB of hard drive space, the final relational database scales efficiently with the addition of new sequences (<xref ref-type="bibr" rid="B58">Seabolt et al., 2020</xref>).</p>
</sec>
<sec id="s4-2">
<title>4.2 Creation of ggMOB</title>
<p>After curation and annotation of the data, we identified all candidate conjugative and cargo proteins in order to create ggMOB. In particular, we used both the primary literature and the InterProScan coding system to generate a list of conjugative features for ggMOB. This led us to consider the following 12 InterProScan codes:<list list-type="simple">
<list-item>
<p>1. IPR005094 describes relaxases and mobilisation proteins, as exemplified by MobA/VirD2 (<xref ref-type="bibr" rid="B45">Pansegrau et al., 1993</xref>; <xref ref-type="bibr" rid="B13">Byrd and Matson, 1997</xref>; <xref ref-type="bibr" rid="B52">Quevillon et al., 2005</xref>).</p>
</list-item>
<list-item>
<p>2. IPR011119 represents a domain found in Proteobacteria annotated as helicase, conjugative relaxase or nickase (<xref ref-type="bibr" rid="B67">Street et al., 2003</xref>; <xref ref-type="bibr" rid="B52">Quevillon et al., 2005</xref>).</p>
</list-item>
<list-item>
<p>3. IPR014059 codes for a domain in the N-terminal region of a relaxase-helicase (TrwC) that acts in plasmid R388 conjugation. It has been associated with both DNA cleavage and strand transfer activities, and members of this family are frequently found in genomic proximity to conjugative proteins thought to indicate the presence of integrated plasmids when identified in bacterial chromosomes (<xref ref-type="bibr" rid="B52">Quevillon et al., 2005</xref>; <xref ref-type="bibr" rid="B8">Boer et al., 2006</xref>).</p>
</list-item>
<list-item>
<p>4. IPR014129 represents proteins in the relaxosome complex, exemplified by TraI, which mediates the single-strand nicking and ATP-dependent unwinding of the plasmid molecule <italic>via</italic> two separate domains in the protein (<xref ref-type="bibr" rid="B36">Matson and Ragonese, 2005</xref>; <xref ref-type="bibr" rid="B52">Quevillon et al., 2005</xref>).</p>
</list-item>
<list-item>
<p>5. IPR014862 represents a conserved domain found in the relaxosome complex, as exemplified by TrwC (<xref ref-type="bibr" rid="B52">Quevillon et al., 2005</xref>; <xref ref-type="bibr" rid="B8">Boer et al., 2006</xref>).</p>
</list-item>
<list-item>
<p>6. IPR021300 represents a conserved domain observed in ICE elements in the protein family PFL_4695, and originally identified in <italic>Pseudomonas fluorescens</italic> Pf-5 (<xref ref-type="bibr" rid="B52">Quevillon et al., 2005</xref>; <xref ref-type="bibr" rid="B37">Mavrodi et al., 2009</xref>).</p>
</list-item>
<list-item>
<p>7. IPR022303 describes a family of conjugative transfer ATPases representing predicted ATP-binding proteins associated with DNA conjugative transfer. They are found both in plasmids and bacterial chromosomal regions that appear to derive from integrative elements such as conjugative transposons.</p>
</list-item>
<list-item>
<p>8. IPR025955 describes a family of TraC-related proteins observed in Proteobacteria. TraC is a cytoplasmic, membrane protein encoded by the F transfer region of conjugative plasmids, and is required for the assembly of the F pilus structure, which creates and maintains contact between the donor and recipient cells during conjugation. The family includes predicted ATPases associated with DNA conjugative transfer (<xref ref-type="bibr" rid="B57">Schandel et al., 1992</xref>; <xref ref-type="bibr" rid="B52">Quevillon et al., 2005</xref>).</p>
</list-item>
<list-item>
<p>9. IPR022391 represents the N-terminal domain of proteins associated with conjugative relaxases in the PFGI-1 class, which includes TraI putative relaxases required for ICE function. While these relaxases are similar in function to TraI relaxases of the F plasmid, they have no sequence homology (<xref ref-type="bibr" rid="B52">Quevillon et al., 2005</xref>).</p>
</list-item>
<list-item>
<p>10. IPR011952 represents CD-NTase-associated protein 3, a group of proteins that function as part of CBASS (cyclic oligonucleotide-based antiphage signaling system), which provides immunity against bacteriophages (<xref ref-type="bibr" rid="B39">Millman et al., 2020</xref>).</p>
</list-item>
<list-item>
<p>11. IPR014136 encompasses TraA, a Ti-type conjugative transfer relaxase that likely nicks the OriT site and unwinds the coiled plasmid prior to conjugative transfer (similar to TraI(F) in this respect) (<xref ref-type="bibr" rid="B26">Harris et al., 1999</xref>).</p>
</list-item>
<list-item>
<p>12. IPR020369 represents mobilization protein B (MobB), which is thought to play a role in conjugative exchange by presenting MobA and its covalently-linked plasmid DNA to the conjugative pore for subsequent export (<xref ref-type="bibr" rid="B38">Meyer, 2011</xref>).</p>
</list-item>
</list>
</p>
<p>We supplemented the IPR features with additional conjugative features that provide essential functions in the conjugation process, including conjugative relaxases, nickases, helicases, and other mobilisation proteins (<xref ref-type="bibr" rid="B57">Schandel et al., 1992</xref>; <xref ref-type="bibr" rid="B45">Pansegrau et al., 1993</xref>; <xref ref-type="bibr" rid="B13">Byrd and Matson, 1997</xref>; <xref ref-type="bibr" rid="B8">Boer et al., 2006</xref>) (<xref ref-type="table" rid="T1">Table 1</xref>). These conjugative features contain substantial sequence diversity, (<xref ref-type="bibr" rid="B22">Frost et al., 2005</xref>; <xref ref-type="bibr" rid="B75">Wozniak and Waldor, 2010</xref>; <xref ref-type="bibr" rid="B49">Perry and Wright, 2013</xref>; <xref ref-type="bibr" rid="B27">Johnson and Grossman, 2015</xref>; <xref ref-type="bibr" rid="B60">Singer et al., 2016</xref>), but also represent conserved domains involved in the machinery required for conjugative transfer. Using standard SQL queries, we obtained a list of the unique identifiers that have one or more of the features described above, resulting in a list of 28,042 candidate conjugation proteins. From this list, we removed those that appeared exactly in only a single genome, which further reduced the list of potential conjugation proteins to 15,398 across 95,781 genomes. We refer to this resulting set of genomes as <italic>conjugative genomes</italic> because they contain putative conjugation features (<xref ref-type="sec" rid="s9">Supplementary Table S4</xref>). We note that these genomes represent 51% of all genomes in the relational database.</p>
<p>Next, we performed SQL queries in order to identify proteins most likely to be cargo based on evidence of conjugative transfer. To minimize misclassification of proteins as cargo, we applied two rules: (1) the proteins had to be present in at least two genomes with the same conjugative protein; and (2) they could not be present in any non-conjugative genome. To accomplish the query, we first queried the database for all proteins in the 95,781 conjugative genomes, which produced a list of 387,682,038 distinct &#x3c; conjugative genome accession number, protein &#x3e; tuples. In many cases a unique sequence was observed in more than one genome, and therefore, in total there were 21,207,794 distinct protein sequences in the set of conjugative genomes. Next, we filtered this list in order to identify the set of proteins that appeared in two or more conjugative genomes. To further reduce false positive identification of transfer by conjugation (vs. being vertically transferred), we discarded any protein that appeared in any of the 99,052 non-conjugative genomes. With this strict selection process, we identified 11,276,651 distinct sequences that we refer to as <italic>cargo proteins</italic>, i.e., proteins with the greatest evidence of conjugative transfer. Lastly, we tabulated these results to produce a list of triples of the form &#x3c; cargo protein, conjugative genome A, conjugative genome B&#x3e; which describe genome A and genome B contained at least one identical conjugative protein sequence, yielding a total of 4,938,737,476 putative transfers. We used this file as input to a custom python script that identifies all intra- and inter-genera cargo protein transfers for each protein by comparing all pairs of genomes in order to identify the intersection of conjugative proteins of each pair of genomes, and the cargo proteins (if any) in this intersection. The output of this script was used to create the ggMOB network, which contains a node for each genus, and an edge between any pair of nodes in which the value of co-occurrence of &#x3c;conjugative protein, cargo protein&#x3e; is non-empty (see <ext-link ext-link-type="uri" xlink:href="https://github.com/Ruiz-HCI-Lab/ggMOB">https://github.com/Ruiz-HCI-Lab/ggMOB</ext-link> for source files and code).</p>
</sec>
<sec id="s4-3">
<title>4.3 Additional analyses</title>
<sec id="s4-3-1">
<title>4.3.1 Conjugation and cargo gene proximity</title>
<p>To characterize the genomic proximity of conjugative and cargo genes within the conjugative genome pairs, we used our compiled list of genera, genomes, conjugative and cargo proteins, along with Prokka&#x2019;s accession index, which indicates the position of a gene or protein sequence within the assembled sequences. While this approach was limited by the fact that the order of assembled sequences is unknown, the Prokka index does indicate position of annotated sequences within each assembled sequence; this information was used in a visual display of genomic distance (<xref ref-type="fig" rid="F2">Figure 2</xref>).</p>
</sec>
<sec id="s4-3-2">
<title>4.3.2 Characterizing AMR genes</title>
<p>We identified all AMR proteins by querying our relational database with all sequences in the MEGARes database (<xref ref-type="bibr" rid="B30">Lakin et al., 2016</xref>). To obtain consistent annotations, we annotated the sequences in MEGARes in the same format as was used to annotate the set of all proteins in the database. We note that we were able to maintain high confidence that these annotations represent AMR proteins because the annotations were derived by exact sequence matching. Next, we extracted the set of cargo proteins with (self-consistent) names that matched any MEGARes AMR protein name. These data were then used to compute the frequency of observing each AMR gene in genomes that contained and did not contain conjugative features.</p>
</sec>
<sec id="s4-4">
<title>4.3.3 NCBI antibiotic susceptibility testing BioSample data</title>
<p>To analyze associations between phenotypic AMR and genomic conjugation features, we retrieved metadata for each NCBI accession that contained antimicrobial susceptibility testing that contained AST data, which include genomic accession number for each isolate, the antibiotic compound(s) against which it was tested, the AST type, and the phenotypic outcome (resistant, susceptible, or intermediate). We only considered those isolates with a resistant phenotypic outcome to be resistant. By linking the BioSample accession with the SRA accessions in our relational database, we were able to identify genomes for which corresponding AST data were available. These genomes were used in our analysis of phenotyic AMR and conjugative features.</p>
</sec>
<sec id="s4-5">
<title>4.3.4 Classification of plasmid and conjugation proteins</title>
<p>We note that many of the InterPro codes listed in <xref ref-type="table" rid="T1">Table 1</xref> contain conjugative machinery found in both plasmids and ICEs. Since these two groups of MGEs exhibit unique microbial ecological and epidemiological dynamics regarding AMR, we attempted to further annotate conjugative proteins identified within our set of genomes. To accomplish this, we first queried NCBI for bacterial plasmids. All of these assembled bacterial plasmids were downloaded from NCBI and annotated <italic>via</italic> our Prokka and InterProScan pipelines. The annotated plasmid associated proteins were then placed in a database table. The MD5 hash was used as the primary key for entries in this table, as was true for every sequence entity in the FGP database. Determining whether a protein had been observed on a plasmid in any of the reference genomes was then accomplished by querying for the primary (i.e., FGP) key of each protein within the table of plasmid-associated proteins. If the primary key existed in both tables, we considered that protein to be a plasmid-associated protein. These data were used in the analyses shown in <xref ref-type="fig" rid="F3">Figure 3</xref>.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>AMR Protein Detection in Plasmids versus Conjugative Genomes. 2D histogram showing the probability that AMR proteins were found in conjugative genomes (<italic>x</italic>-axis) <italic>versus</italic> the fraction of AMR proteins observed on plasmids (<italic>y</italic>-axis). Independent of presence on conjugative genomes, 5%&#x2013;10% of AMR proteins were observed on plasmids, whereas the majority of AMR proteins were found in conjugative genomes.</p>
</caption>
<graphic xlink:href="fgene-13-1024577-g003.tif"/>
</fig>
</sec>
<sec id="s4-6">
<title>4.3.5 Tabulation of data</title>
<p>Conjugative genomes were tabulated by genus as shown in <xref ref-type="table" rid="T2">Table 2</xref>. Observed conjugative features from <xref ref-type="table" rid="T1">Table 1</xref> were tabulated by genome for the analysis shown in <xref ref-type="fig" rid="F1">Figures 1</xref>, <xref ref-type="fig" rid="F5">5</xref>. Similarly, proteins assigned AMR-associated annotations were tabulated by number of conjugative and non-conjugative genomes, and the fraction of unique sequences observed in plasmids was tabulated as well (See <xref ref-type="fig" rid="F4">Figure 4</xref>).</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Co-occurrence of AMR proteins with conjugative features, for the 138 AMR proteins observed in conjugative genomes with a frequency greater than 5x the frequency of observation in non-conjugative genomes. Of these AMR proteins, 43 are <italic>only</italic> observed in conjugative genomes.</p>
</caption>
<graphic xlink:href="fgene-13-1024577-g004.tif"/>
</fig>
</sec>
<sec id="s4-7">
<title>4.3.6 Hierarchical clustering and co-occurrence</title>
<p>Hierarchical clustering was used to characterize the co-occurrence of proteins or genomes by conjugation feature (<xref ref-type="fig" rid="F1">Figures 1</xref>, <xref ref-type="fig" rid="F4">4</xref>, <xref ref-type="fig" rid="F5">5</xref>. The co-occurrence matrix was generated using the Seaborn <monospace>clustermap</monospace> algorithm, which performs single linkage clustering to generate heatmaps and dendrograms (<xref ref-type="bibr" rid="B73">Waskom, 2015</xref>). The vector of features used to generate the heatmap shown in <xref ref-type="fig" rid="F2">Figure 2</xref> was the vector of conjugation features for each genome, which in order to compute the (Euclidean) distance between each genome. Again, Seaborn <monospace>clustermap</monospace> was used for hierarchical clustering and visualization.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Genome-IPR Co-Occurence Map. Co-occurrence of conjugation features by genome, for the 6,000 genomes with the highest cargo protein fraction and the 500 genomes with the rarest conjugation features (see text). Co-occurrence of particular conjugation features does vary by taxonomic group.</p>
</caption>
<graphic xlink:href="fgene-13-1024577-g005.tif"/>
</fig>
</sec>
</sec>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s5">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article <xref ref-type="sec" rid="s9">Supplementary Material</xref> and at <ext-link ext-link-type="uri" xlink:href="https://github.com/Ruiz-HCI-Lab/ggMOB">https://github.com/Ruiz-HCI-Lab/ggMOB</ext-link>. Further inquiries can be directed to the corresponding author.</p>
</sec>
<sec id="s6">
<title>Author contributions</title>
<p>GN, JK, IT, and IS performed and designed research, compiled supporting data, analyzed data, and wrote the paper. GN and AA developed big data visualizations, classified AMR genes and assay data, and contributed to the paper. ES built the database, pipeline, and contributed to the paper. CB provided input on research design, methods and visualizations, and contributed to the paper. NN proposed the study, provided input into the research design, and wrote the paper. JR built the online ggMOB dynamic network and contributed to the paper.</p>
</sec>
<sec id="s7">
<title>Funding</title>
<p>Financial support for this study was provided by the National Institute of Allergy and Infectious Diseases (NIAID) of the US. National Institutes of Health (NIH), Project No. 1R01AI141810-01 and the National Institute of Food and Agriculture of the United States Department of Agriculture (USDA NIFA), Project No. MINV62-058.</p>
</sec>
<ack>
<p>The authors would like to acknowledge contributions from M. Roth, H. Krishnareddy, K. Clarkson, and E. Kandogan.</p>
</ack>
<sec sec-type="COI-statement" id="s8">
<title>Conflict of interest</title>
<p>ES and AA are currently employed by IBM, GN and JK were employed by IBM at the time of this work. JK is currently employed by Altos Labs.</p>
<p>The remaining authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s9">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s10">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fgene.2022.1024577/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fgene.2022.1024577/full&#x23;supplementary-material</ext-link>
</p>
<supplementary-material>
<label>Supplementary Figure S1</label>
<caption>
<p>Co-occurrence of AMR proteins with conjugative features.Co-occurrence of AMR proteins with conjugative features for the 29 AMR proteins observed in non-conjugative genomes with a frequency at least 5x the frequency of observation in conjugative genomes..</p>
</caption>
</supplementary-material>
<supplementary-material>
<label>Supplementary Figure S2</label>
<caption>
<p>Heatmap of Genome-Genome Distances Based on Conjugation Feature Profiles. Genome-genome Euclidean distance between vectors of conjugation features for the 6500 genomes used in 5. For visualization purposes, 1 in 75 labels were rendered on each axis. The figure shows that different sets of genomes cluster based on different co-occurring conjugation features..</p>
</caption>
</supplementary-material>
<supplementary-material xlink:href="DataSheet4.CSV" id="SM1" mimetype="application/CSV" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="DataSheet3.XLSX" id="SM2" mimetype="application/XLSX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="DataSheet1.CSV" id="SM3" mimetype="application/CSV" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="DataSheet2.XLSX" id="SM4" mimetype="application/XLSX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Abby</surname>
<given-names>S. S.</given-names>
</name>
<name>
<surname>Tannier</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Gouy</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Daubin</surname>
<given-names>V.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Lateral gene transfer as a support for the tree of life</article-title>. <source>Proc. Natl. Acad. Sci. U. S. A.</source> <volume>109</volume> (<issue>13</issue>), <fpage>4962</fpage>&#x2013;<lpage>4967</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1116871109</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alderliesten</surname>
<given-names>J. B.</given-names>
</name>
<name>
<surname>Duxbury</surname>
<given-names>S. J. N.</given-names>
</name>
<name>
<surname>Zwart</surname>
<given-names>M. P.</given-names>
</name>
<name>
<surname>de Visser</surname>
<given-names>J. A. G. M.</given-names>
</name>
<name>
<surname>Stegeman</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Fischer</surname>
<given-names>E. A. J.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Effect of donor-recipient relatedness on the plasmid conjugation frequency: A meta-analysis</article-title>. <source>BMC Microbiol.</source> <volume>20</volume>, <fpage>135</fpage>. <pub-id pub-id-type="doi">10.1186/s12866-020-01825-4</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bacic</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Parker</surname>
<given-names>A. C.</given-names>
</name>
<name>
<surname>Stagg</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Whitley</surname>
<given-names>H. P.</given-names>
</name>
<name>
<surname>Wells</surname>
<given-names>W. G.</given-names>
</name>
<name>
<surname>Jacob</surname>
<given-names>L. A.</given-names>
</name>
<etal/>
</person-group> (<year>2005</year>). <article-title>Genetic and structural analysis of the Bacteroides conjugative transposon CTn341</article-title>. <source>J. Bacteriol.</source> <volume>187</volume> (<issue>8</issue>), <fpage>2858</fpage>&#x2013;<lpage>2869</lpage>. <pub-id pub-id-type="doi">10.1128/JB.187.8.2858-2869.2005</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bankevich</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Nurk</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Antipov</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Gurevich</surname>
<given-names>A. A.</given-names>
</name>
<name>
<surname>Dvorkin</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Kulikov</surname>
<given-names>A. S.</given-names>
</name>
<etal/>
</person-group> (<year>2012</year>). <article-title>SPAdes: A new genome assembly algorithm and its applications to single-cell sequencing</article-title>. <source>J. Comput. Biol.</source> <volume>19</volume> (<issue>5</issue>), <fpage>455</fpage>&#x2013;<lpage>477</lpage>. <pub-id pub-id-type="doi">10.1089/cmb.2012.0021</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Beaber</surname>
<given-names>J. W.</given-names>
</name>
<name>
<surname>Hochhut</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Waldor</surname>
<given-names>M. K.</given-names>
</name>
</person-group> (<year>2002</year>). <article-title>Genomic and functional analyses of SXT, an integrating antibiotic resistance gene transfer element derived from <italic>Vibrio cholerae</italic>
</article-title>. <source>J. Bacteriol.</source> <volume>184</volume> (<issue>15</issue>), <fpage>4259</fpage>&#x2013;<lpage>4269</lpage>. <pub-id pub-id-type="doi">10.1128/jb.184.15.4259-4269.2002</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bellanger</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Payot</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Leblond-Bourget</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Gu&#xe9;don</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Conjugative and mobilizable genomic islands in bacteria: Evolution and diversity</article-title>. <source>FEMS Microbiol. Rev.</source> <volume>38</volume> (<issue>4</issue>), <fpage>720</fpage>&#x2013;<lpage>760</lpage>. <pub-id pub-id-type="doi">10.1111/1574-6976.12058</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bellanger</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Roberts</surname>
<given-names>A. P.</given-names>
</name>
<name>
<surname>Morel</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Choulet</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Pavlovic</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Mullany</surname>
<given-names>P.</given-names>
</name>
<etal/>
</person-group> (<year>2009</year>). <article-title>Conjugative transfer of the integrative conjugative elements ICESt1 and ICESt3 from Streptococcus thermophilus</article-title>. <source>J. Bacteriol.</source> <volume>191</volume> (<issue>8</issue>), <fpage>2764</fpage>&#x2013;<lpage>2775</lpage>. <pub-id pub-id-type="doi">10.1128/JB.01412-08</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Boer</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Russi</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Guasch</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Lucas</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Blanco</surname>
<given-names>A. G.</given-names>
</name>
<name>
<surname>P&#xe9;rez-Luque</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2006</year>). <article-title>Unveiling the molecular mechanism of a conjugative relaxase: The structure of TrwC complexed with a 27-mer DNA comprising the recognition hairpin and the cleavage site</article-title>. <source>J. Mol. Biol.</source> <volume>358</volume> (<issue>3</issue>), <fpage>857</fpage>&#x2013;<lpage>869</lpage>. <pub-id pub-id-type="doi">10.1016/j.jmb.2006.02.018</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>B&#xf6;ltner</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>MacMahon</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Pembroke</surname>
<given-names>J. T.</given-names>
</name>
<name>
<surname>Strike</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Osborn</surname>
<given-names>A. M.</given-names>
</name>
</person-group> (<year>2002</year>). <article-title>R391: A conjugative integrating mosaic comprised of phage, plasmid, and transposon elements</article-title>. <source>J. Bacteriol.</source> <volume>184</volume> (<issue>18</issue>), <fpage>5158</fpage>&#x2013;<lpage>5169</lpage>. <pub-id pub-id-type="doi">10.1128/jb.184.18.5158-5169.2002</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Botelho</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Mourao</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Roberts</surname>
<given-names>A. P.</given-names>
</name>
<name>
<surname>Peixe</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Comprehensive genome data analysis establishes a triple whammy of carbapenemases, ICEs and multiple clinically relevant bacteria</article-title>. <source>Microb. Genom.</source> <volume>6</volume>. <pub-id pub-id-type="doi">10.1099/mgen.0.000424</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Burrus</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Marrero</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Waldor</surname>
<given-names>M. K.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>The current ICE age: Biology and evolution of SXT-related integrating conjugative elements</article-title>. <source>Plasmid</source> <volume>55</volume> (<issue>3</issue>), <fpage>173</fpage>&#x2013;<lpage>183</lpage>. <pub-id pub-id-type="doi">10.1016/j.plasmid.2006.01.001</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Burrus</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Pavlovic</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Decaris</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Gu&#xe9;don</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2002</year>). <article-title>The ICESt1 element of Streptococcus thermophilus belongs to a large family of integrative and conjugative elements that exchange modules and change their specificity of integration</article-title>. <source>Plasmid</source> <volume>48</volume> (<issue>2</issue>), <fpage>77</fpage>&#x2013;<lpage>97</lpage>. <pub-id pub-id-type="doi">10.1016/s0147-619x(02)00102-6</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Byrd</surname>
<given-names>D. R.</given-names>
</name>
<name>
<surname>Matson</surname>
<given-names>S. W.</given-names>
</name>
</person-group> (<year>1997</year>). <article-title>Nicking by transesterification: The reaction catalysed by a relaxase</article-title>. <source>Mol. Microbiol.</source> <volume>25</volume> (<issue>6</issue>), <fpage>1011</fpage>&#x2013;<lpage>1022</lpage>. <pub-id pub-id-type="doi">10.1046/j.1365-2958.1997.5241885.x</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chan</surname>
<given-names>A. P.</given-names>
</name>
<name>
<surname>Sutton</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>DePew</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Krishnakumar</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Choi</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>X. Z.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>A novel method of consensus pan-chromosome assembly and large-scale comparative analysis reveal the highly flexible pan-genome of Acinetobacter baumannii</article-title>. <source>Genome Biol.</source> <volume>16</volume>, <fpage>143</fpage>. <pub-id pub-id-type="doi">10.1186/s13059-015-0701-6</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Clewell</surname>
<given-names>D. B.</given-names>
</name>
<name>
<surname>Flannagan</surname>
<given-names>S. E.</given-names>
</name>
<name>
<surname>Jaworski</surname>
<given-names>D. D.</given-names>
</name>
</person-group> (<year>1995</year>). <article-title>Unconstrained bacterial promiscuity: The tn916&#x2013;tn1545 family of conjugative transposons</article-title>. <source>Trends Microbiol.</source> <volume>3</volume> (<issue>6</issue>), <fpage>229</fpage>&#x2013;<lpage>236</lpage>. <pub-id pub-id-type="doi">10.1016/s0966-842x(00)88930-1</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cohen</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Gophna</surname>
<given-names>U.</given-names>
</name>
<name>
<surname>Pupko</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>The complexity hypothesis revisited: Connectivity rather than function constitutes a barrier to horizontal gene transfer</article-title>. <source>Mol. Biol. Evol.</source> <volume>28</volume> (<issue>4</issue>), <fpage>1481</fpage>&#x2013;<lpage>1489</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msq333</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cury</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Oliveira</surname>
<given-names>P. H.</given-names>
</name>
<name>
<surname>de la Cruz</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Rocha</surname>
<given-names>E. P. C.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Host range and genetic plasticity explain the coexistence of integrative and extrachromosomal mobile genetic elements</article-title>. <source>Mol. Biol. Evol.</source> <volume>35</volume> (<issue>9</issue>), <fpage>2850</fpage>&#x2013;<lpage>2239</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msy182</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cury</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Touchon</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Rocha</surname>
<given-names>E. P. C.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Integrative and conjugative elements and their hosts: Composition, distribution and organization</article-title>. <source>Nucleic Acids Res.</source> <volume>45</volume> (<issue>15</issue>), <fpage>8943</fpage>&#x2013;<lpage>8956</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkx607</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Delavat</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Miyazaki</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Carraro</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Pradervand</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>van der Meer</surname>
<given-names>J. R.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>The hidden life of integrative and conjugative elements</article-title>. <source>FEMS Microbiol. Rev.</source> <volume>41</volume> (<issue>4</issue>), <fpage>512</fpage>&#x2013;<lpage>537</lpage>. <pub-id pub-id-type="doi">10.1093/femsre/fux008</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Everitt</surname>
<given-names>R. G.</given-names>
</name>
<name>
<surname>Didelot</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Batty</surname>
<given-names>E. M.</given-names>
</name>
<name>
<surname>Miller</surname>
<given-names>R. R.</given-names>
</name>
<name>
<surname>Knox</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Young</surname>
<given-names>B. C.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>Mobile elements drive recombination hotspots in the core genome of <italic>Staphylococcus aureus</italic>
</article-title>. <source>Nat. Commun.</source> <volume>5</volume>, <fpage>3956</fpage>. <pub-id pub-id-type="doi">10.1038/ncomms4956</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Finn</surname>
<given-names>R. D.</given-names>
</name>
<name>
<surname>Attwood</surname>
<given-names>T. K.</given-names>
</name>
<name>
<surname>Babbitt</surname>
<given-names>P. C.</given-names>
</name>
<name>
<surname>Bateman</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Bork</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Bridge</surname>
<given-names>A. J.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Interpro in 2017 &#x2013; beyond protein family and domain annotations</article-title>. <source>Nucleic Acids Res.</source> <volume>45</volume> (<issue>D1</issue>), <fpage>D190-D199</fpage>. <pub-id pub-id-type="doi">10.1093/nar/gkw1107</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Frost</surname>
<given-names>L. S.</given-names>
</name>
<name>
<surname>Leplae</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Summers</surname>
<given-names>A. O.</given-names>
</name>
<name>
<surname>Toussaint</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Mobile genetic elements: The agents of open source evolution</article-title>. <source>Nat. Rev. Microbiol.</source> <volume>3</volume> (<issue>9</issue>), <fpage>722</fpage>&#x2013;<lpage>732</lpage>. <pub-id pub-id-type="doi">10.1038/nrmicro1235</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Garnier</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Taourit</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Glaser</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Courvalin</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Galimand</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2000</year>). <article-title>Characterization of transposon Tn1549, conferring VanB-type resistance in Enterococcus spp</article-title>. <source>Microbiology</source> <volume>146</volume> (<issue>6</issue>), <fpage>1481</fpage>&#x2013;<lpage>1489</lpage>. <pub-id pub-id-type="doi">10.1099/00221287-146-6-1481</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gaston</surname>
<given-names>J. M.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Poyet</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Groussin</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>An omics-based framework for assessing the health risk of antimicrobial resistance genes</article-title>. <source>Nat. Commun.</source> <volume>12</volume>, <fpage>4765</fpage>. <pub-id pub-id-type="doi">10.1038/s41467-021-25096-3</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Guglielmini</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Quintais</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Garcill&#xe1;n-Barcia</surname>
<given-names>M. P.</given-names>
</name>
<name>
<surname>de La Cruz</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Rocha</surname>
<given-names>E. P. C.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>The repertoire of ICE in prokaryotes underscores the unity, diversity, and ubiquity of conjugation</article-title>. <source>PLoS Genet.</source> <volume>7</volume> (<issue>8</issue>), <fpage>e1002222</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pgen.1002222</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Harris</surname>
<given-names>R. L.</given-names>
</name>
<name>
<surname>Sholl</surname>
<given-names>K. A.</given-names>
</name>
<name>
<surname>Conrad</surname>
<given-names>M. N.</given-names>
</name>
<name>
<surname>Dresser</surname>
<given-names>M. E.</given-names>
</name>
<name>
<surname>Silverman</surname>
<given-names>P. M.</given-names>
</name>
</person-group> (<year>1999</year>). <article-title>Interaction between the F plasmid TraA (F-pilin) and TraQ proteins</article-title>. <source>Mol. Microbiol.</source> <volume>34</volume> (<issue>4</issue>), <fpage>780</fpage>&#x2013;<lpage>791</lpage>. <pub-id pub-id-type="doi">10.1046/j.1365-2958.1999.01640.x</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Johnson</surname>
<given-names>C. M.</given-names>
</name>
<name>
<surname>Grossman</surname>
<given-names>A. D.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Integrative and conjugative elements (ICEs): What they do and how they work</article-title>. <source>Annu. Rev. Genet.</source> <volume>49</volume>, <fpage>577</fpage>&#x2013;<lpage>601</lpage>. <pub-id pub-id-type="doi">10.1146/annurev-genet-112414-055018</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Klockgether</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Reva</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Larbig</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>T&#xfc;mmler</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Sequence analysis of the mobile genome island pKLC102 of <italic>Pseudomonas aeruginosa</italic> C</article-title>. <source>J. Bacteriol.</source> <volume>186</volume> (<issue>2</issue>), <fpage>518</fpage>&#x2013;<lpage>534</lpage>. <pub-id pub-id-type="doi">10.1128/jb.186.2.518-534.2004</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Koraimann</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Wagner</surname>
<given-names>M. A.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Social behavior and decision making in bacterial conjugation</article-title>. <source>Front. Cell.. Infect. Microbiol.</source> <volume>4</volume>, <fpage>54</fpage>. <pub-id pub-id-type="doi">10.3389/fcimb.2014.00054</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lakin</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Dean</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Noyes</surname>
<given-names>N. R.</given-names>
</name>
<name>
<surname>Dettenwanger</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Ross</surname>
<given-names>A. S.</given-names>
</name>
<name>
<surname>Doster</surname>
<given-names>E.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>MEGARes: An antimicrobial resistance database for high throughput sequencing</article-title>. <source>Nucleic Acids Res.</source> <volume>45</volume> (<issue>D1</issue>), <fpage>D574-D580</fpage>&#x2013;<lpage>D580</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkw1009</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lechner</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Schmitt</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Bauer</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Hot</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Hubans</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Levillain</surname>
<given-names>E.</given-names>
</name>
<etal/>
</person-group> (<year>2009</year>). <article-title>Genomic island excisions in Bordetella petrii</article-title>. <source>BMC Microbiol.</source> <volume>9</volume> (<issue>1</issue>), <fpage>141</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2180-9-141</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lee</surname>
<given-names>C. A.</given-names>
</name>
<name>
<surname>Thomas</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Grossman</surname>
<given-names>A. D.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>The Bacillus subtilis conjugative transposon ICEBs1 mobilizes plasmids lacking dedicated mobilization functions</article-title>. <source>J. Bacteriol.</source> <volume>194</volume> (<issue>12</issue>), <fpage>3165</fpage>&#x2013;<lpage>3172</lpage>. <pub-id pub-id-type="doi">10.1128/JB.00301-12</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Logan</surname>
<given-names>L. K.</given-names>
</name>
<name>
<surname>Weinstein</surname>
<given-names>R. A.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>The epidemiology of carbapenem-resistant Enterobacteriaceae: The impact and evolution of a global menace</article-title>. <source>J. Infect. Dis.</source> <volume>215</volume> (<issue>1</issue>), <fpage>S28</fpage>&#x2013;<lpage>S36</lpage>. <comment>S28&#x2013;S36</comment>. <pub-id pub-id-type="doi">10.1093/infdis/jiw282</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lopatkin</surname>
<given-names>A. J.</given-names>
</name>
<name>
<surname>Collin</surname>
<given-names>J. J.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Predictive biology: Modelling, understanding and harnessing microbial complexity</article-title>. <source>Nat. Rev. Microbiol.</source> <volume>18</volume>, <fpage>507</fpage>&#x2013;<lpage>520</lpage>. <pub-id pub-id-type="doi">10.1038/s41579-020-0372-5</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mart&#xed;nez</surname>
<given-names>J. L.</given-names>
</name>
<name>
<surname>Coque</surname>
<given-names>T. M.</given-names>
</name>
<name>
<surname>Baquero</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>What is a resistance gene? Ranking risk in resistomes</article-title>. <source>Nat. Rev. Microbiol.</source> <volume>13</volume> (<issue>2</issue>), <fpage>116</fpage>&#x2013;<lpage>123</lpage>. <pub-id pub-id-type="doi">10.1038/nrmicro3399</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Matson</surname>
<given-names>S. W.</given-names>
</name>
<name>
<surname>Ragonese</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>The F-plasmid TraI protein contains three functional domains required for conjugative DNA strand transfer</article-title>. <source>J. Bacteriol.</source> <volume>187</volume> (<issue>2</issue>), <fpage>697</fpage>&#x2013;<lpage>706</lpage>. <pub-id pub-id-type="doi">10.1128/JB.187.2.697-706.2005</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mavrodi</surname>
<given-names>D. V.</given-names>
</name>
<name>
<surname>Loper</surname>
<given-names>J. E.</given-names>
</name>
<name>
<surname>Paulsen</surname>
<given-names>I. T.</given-names>
</name>
<name>
<surname>Thomashow</surname>
<given-names>L. S.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Mobile genetic elements in the genome of the beneficial rhizobacterium Pseudomonas fluorescens Pf-5</article-title>. <source>BMC Microbiol.</source> <volume>9</volume> (<issue>1</issue>), <fpage>8</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2180-9-8</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Meyer</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Functional organization of MobB, a small protein required for efficient conjugal transfer of plasmid R1162</article-title>. <source>J. Bacteriol.</source> <volume>193</volume> (<issue>15</issue>), <fpage>3904</fpage>&#x2013;<lpage>3911</lpage>. <pub-id pub-id-type="doi">10.1128/JB.05084-11</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Millman</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Melamed</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Amitai</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Sorek</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Diversity and classification of cyclic-oligonucleotide-based anti-phage signalling systems</article-title>. <source>Nat. Microbiol.</source> <volume>5</volume> (<issue>12</issue>), <fpage>1608</fpage>&#x2013;<lpage>1615</lpage>. <pub-id pub-id-type="doi">10.1038/s41564-020-0777-y</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mohd-Zain</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Turner</surname>
<given-names>S. L.</given-names>
</name>
<name>
<surname>Cerdeno-T&#xe1;rraga</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Lilley</surname>
<given-names>A. K.</given-names>
</name>
<name>
<surname>Inzana</surname>
<given-names>T. J.</given-names>
</name>
<name>
<surname>Duncan</surname>
<given-names>A. J.</given-names>
</name>
<etal/>
</person-group> (<year>2004</year>). <article-title>Transferable antibiotic resistance elements in Haemophilus influenzae share a common evolutionary origin with a diverse family of syntenic genomic islands</article-title>. <source>J. Bacteriol.</source> <volume>186</volume> (<issue>23</issue>), <fpage>8114</fpage>&#x2013;<lpage>8122</lpage>. <pub-id pub-id-type="doi">10.1128/JB.186.23.8114-8122.2004</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Obi</surname>
<given-names>C. C.</given-names>
</name>
<name>
<surname>Vayla</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>De Gannes</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Berres</surname>
<given-names>M. E.</given-names>
</name>
<name>
<surname>Walker</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Pavelec</surname>
<given-names>D.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>The integrative conjugative element clc (ICEclc) of <italic>Pseudomonas aeruginosa</italic> JB2</article-title>. <source>Front. Microbiol.</source> <volume>9</volume>, <fpage>1532</fpage>. <pub-id pub-id-type="doi">10.3389/fmicb.2018.01532</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Oh</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Pruden</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Heath</surname>
<given-names>L. S.</given-names>
</name>
<name>
<surname>Xia</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>MetaCompare: A computational pipeline for prioritizing environmental resistome risk</article-title>. <source>FEMS Microbiol. Ecol.</source> <volume>94</volume> (<issue>6</issue>), <fpage>fiy079</fpage>. <pub-id pub-id-type="doi">10.1093/femsec/fiy079</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Osorio</surname>
<given-names>C. R.</given-names>
</name>
<name>
<surname>Marrero</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wozniak</surname>
<given-names>R. A. F.</given-names>
</name>
<name>
<surname>Lemos</surname>
<given-names>M. L.</given-names>
</name>
<name>
<surname>Burrus</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Waldor</surname>
<given-names>M. K.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Genomic and functional analysis of ICEPdaSpa1, a fish-pathogen-derived SXT-related integrating conjugative element that can mobilize a virulence plasmid</article-title>. <source>J. Bacteriol.</source> <volume>190</volume> (<issue>9</issue>), <fpage>3353</fpage>&#x2013;<lpage>3361</lpage>. <pub-id pub-id-type="doi">10.1128/JB.00109-08</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Paauw</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Leverstein-van Hall</surname>
<given-names>M. A.</given-names>
</name>
<name>
<surname>Verhoef</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Fluit</surname>
<given-names>A. C.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Evolution in quantum leaps: Multiple combinatorial transfers of HPI and other genetic modules in Enterobacteriaceae</article-title>. <source>PLoS ONE</source> <volume>5</volume> (<issue>1</issue>), <fpage>e8662</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0008662</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pansegrau</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Schoumacher</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Hohn</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Lanka</surname>
<given-names>E.</given-names>
</name>
</person-group> (<year>1993</year>). <article-title>Site-specific cleavage and joining of single-stranded DNA by VirD2 protein of agrobacterium tumefaciens Ti plasmids: Analogy to bacterial conjugation</article-title>. <source>Proc. Natl. Acad. Sci. U. S. A.</source> <volume>90</volume> (<issue>24</issue>), <fpage>11538</fpage>&#x2013;<lpage>11542</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.90.24.11538</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Parker</surname>
<given-names>B. J.</given-names>
</name>
<name>
<surname>Wearsch</surname>
<given-names>P. A.</given-names>
</name>
<name>
<surname>Veloo</surname>
<given-names>A. C. M.</given-names>
</name>
<name>
<surname>Rodriguez-Palacios</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>The genus Alistipes: Gut bacteria with emerging implications to inflammation, cancer, and mental health</article-title>. <source>Front. Immunol.</source> <volume>11</volume>, <fpage>906</fpage>. <pub-id pub-id-type="doi">10.3389/fimmu.2020.00906</pub-id>
</citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Partridge</surname>
<given-names>S. R.</given-names>
</name>
<name>
<surname>Kwong</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Firth</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Jensen</surname>
<given-names>S. O.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Mobile genetic elements associated with antimicrobial resistance</article-title>. <source>Clin. Microbiol. Rev.</source> <volume>31</volume>. <pub-id pub-id-type="doi">10.1128/cmr.00088-17</pub-id>
</citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Peed</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Parker</surname>
<given-names>A. C.</given-names>
</name>
<name>
<surname>Smith</surname>
<given-names>C. J.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Genetic and functional analyses of the mob operon on conjugative transposon CTn341 from Bacteroides spp</article-title>. <source>J. Bacteriol.</source> <volume>192</volume> (<issue>18</issue>), <fpage>4643</fpage>&#x2013;<lpage>4650</lpage>. <pub-id pub-id-type="doi">10.1128/JB.00317-10</pub-id>
</citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Perry</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wright</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>The antibiotic resistance &#x201c;mobilome&#x201d;: Searching for the link between environment and clinic</article-title>. <source>Front. Microbiol.</source> <volume>4</volume>, <fpage>138</fpage>. <pub-id pub-id-type="doi">10.3389/fmicb.2013.00138</pub-id>
</citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Prokka</surname>
<given-names>T. S.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Prokka: Rapid prokaryotic genome annotation</article-title>. <source>Bioinformatics</source> <volume>30</volume> (<issue>14</issue>), <fpage>2068</fpage>&#x2013;<lpage>2069</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btu153</pub-id>
</citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Qiu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Gurkar</surname>
<given-names>A. U.</given-names>
</name>
<name>
<surname>Lory</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>Interstrain transfer of the large pathogenicity island (PAPI-1) of <italic>Pseudomonas aeruginosa</italic>
</article-title>. <source>Proc. Natl. Acad. Sci. U. S. A.</source> <volume>103</volume> (<issue>52</issue>), <fpage>19830</fpage>&#x2013;<lpage>19835</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.0606810104</pub-id>
</citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Quevillon</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>SilVentoinen</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Pillai</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>HarteN.</surname>
</name>
<name>
<surname>MulderN.</surname>
</name>
<name>
<surname>ApweileR</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2005</year>). <article-title>InterProScan: Protein domains identifier</article-title>. <source>Nucleic Acids Res.</source> <volume>33</volume> (<issue>2</issue>), <fpage>W116</fpage>&#x2013;<lpage>W120</lpage>. <comment>&#x2013;W120</comment>. <pub-id pub-id-type="doi">10.1093/nar/gki442</pub-id>
</citation>
</ref>
<ref id="B53">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Ramsay</surname>
<given-names>J. P.</given-names>
</name>
<name>
<surname>Ronson</surname>
<given-names>C. W.</given-names>
</name>
</person-group> (<year>2015</year>). <source>Genetic regulation of symbiosis island transfer in Mesorhizobium loti</source>. <publisher-loc>New York, NY</publisher-loc>: <publisher-name>John Wiley &#x26; Sons</publisher-name>, <fpage>219</fpage>.</citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Roberts</surname>
<given-names>A. P.</given-names>
</name>
<name>
<surname>Mullany</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Tn916-like genetic elements: A diverse group of modular mobile elements conferring antibiotic resistance</article-title>. <source>FEMS Microbiol. Rev.</source> <volume>35</volume> (<issue>5</issue>), <fpage>856</fpage>&#x2013;<lpage>871</lpage>. <pub-id pub-id-type="doi">10.1111/j.1574-6976.2011.00283.x</pub-id>
</citation>
</ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Roche</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Flechard</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Lallier</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Reperant</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Bree</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Pascal</surname>
<given-names>G.</given-names>
</name>
<etal/>
</person-group> (<year>2010</year>). <article-title>ICEEc2, a new integrative and conjugative element belonging to the pKLC102/PAGI-2 family, identified in <italic>Escherichia coli</italic> strain BEN374</article-title>. <source>J. Bacteriol.</source> <volume>192</volume> (<issue>19</issue>), <fpage>5026</fpage>&#x2013;<lpage>5036</lpage>. <pub-id pub-id-type="doi">10.1128/JB.00609-10</pub-id>
</citation>
</ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Neil</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Allard</surname>
<given-names>N.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Molecular mechanisms influencing bacterial conjugation in the intestinal microbiota</article-title>. <source>Front. Microbiol.</source> <volume>12</volume>, <fpage>673260</fpage>. <pub-id pub-id-type="doi">10.3389/fmicb.2021.673260</pub-id>
</citation>
</ref>
<ref id="B57">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Schandel</surname>
<given-names>K. A.</given-names>
</name>
<name>
<surname>Muller</surname>
<given-names>M. M.</given-names>
</name>
<name>
<surname>Webster</surname>
<given-names>R. E.</given-names>
</name>
</person-group> (<year>1992</year>). <article-title>Localization of TraC, a protein involved in assembly of the F conjugative pilus</article-title>. <source>J. Bacteriol.</source> <volume>174</volume> (<issue>11</issue>), <fpage>3800</fpage>&#x2013;<lpage>3806</lpage>. <pub-id pub-id-type="doi">10.1128/jb.174.11.3800-3806.1992</pub-id>
</citation>
</ref>
<ref id="B58">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Seabolt</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Nayar</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Krishnareddy</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Agarwal</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Beck</surname>
<given-names>K. L.</given-names>
</name>
<name>
<surname>Terrizzano</surname>
<given-names>I.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Functional genomics platform, A cloud-based platform for studying microbial life at scale</article-title>. <source>IEEE/ACM Trans. Comput. Biol. Bioinform.</source> <volume>1</volume> (<issue>&#x2013;1</issue>), <fpage>940</fpage>&#x2013;<lpage>952</lpage>. <pub-id pub-id-type="doi">10.1109/TCBB.2020.3021231</pub-id>
</citation>
</ref>
<ref id="B59">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sheppard</surname>
<given-names>R. J.</given-names>
</name>
<name>
<surname>Beddis</surname>
<given-names>A. E.</given-names>
</name>
<name>
<surname>Barraclough</surname>
<given-names>T. G.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>The role of hosts, plasmids and environment in determining plasmid transfer rates: A meta-analysis</article-title>. <source>Plasmid</source> <volume>108</volume>, <fpage>102489</fpage>. <pub-id pub-id-type="doi">10.1016/j.plasmid.2020.102489</pub-id>
</citation>
</ref>
<ref id="B60">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Singer</surname>
<given-names>A. C.</given-names>
</name>
<name>
<surname>Shaw</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Rhodes</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Hart</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Review of antimicrobial resistance in the environment and its relevance to environmental regulators</article-title>. <source>Front. Microbiol.</source> <volume>7</volume>, <fpage>1728</fpage>. <pub-id pub-id-type="doi">10.3389/fmicb.2016.01728</pub-id>
</citation>
</ref>
<ref id="B61">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sitkiewicz</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Green</surname>
<given-names>N. M.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Mereghetti</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Musser</surname>
<given-names>J. M.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Lateral gene transfer of streptococcal ICE element RD2 (region of difference 2) encoding secreted proteins</article-title>. <source>BMC Microbiol.</source> <volume>11</volume> (<issue>1</issue>), <fpage>65</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2180-11-65</pub-id>
</citation>
</ref>
<ref id="B62">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Smith</surname>
<given-names>C. J.</given-names>
</name>
<name>
<surname>Parker</surname>
<given-names>A. C.</given-names>
</name>
</person-group> (<year>1993</year>). <article-title>Identification of a circular intermediate in the transfer and transposition of Tn4555, a mobilizable transposon from Bacteroides spp</article-title>. <source>J. Bacteriol.</source> <volume>175</volume> (<issue>9</issue>), <fpage>2682</fpage>&#x2013;<lpage>2691</lpage>. <pub-id pub-id-type="doi">10.1128/jb.175.9.2682-2691.1993</pub-id>
</citation>
</ref>
<ref id="B63">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Smyth</surname>
<given-names>D. J.</given-names>
</name>
<name>
<surname>Shera</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Bauer</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Cameron</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>McNeilly</surname>
<given-names>C. L.</given-names>
</name>
<name>
<surname>Sriprakash</surname>
<given-names>K. S.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>Conjugative transfer of ICE Sde 3396 between three <italic>&#x3b2;</italic>-hemolytic streptococcal species</article-title>. <source>BMC Res. Notes</source> <volume>7</volume> (<issue>1</issue>), <fpage>521</fpage>. <pub-id pub-id-type="doi">10.1186/1756-0500-7-521</pub-id>
</citation>
</ref>
<ref id="B64">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Smyth</surname>
<given-names>D. S.</given-names>
</name>
<name>
<surname>Robinson</surname>
<given-names>D. A.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Integrative and sequence characteristics of a novel genetic element, ICE6013, in <italic>Staphylococcus aureus</italic>
</article-title>. <source>J. Bacteriol.</source> <volume>191</volume> (<issue>19</issue>), <fpage>5964</fpage>&#x2013;<lpage>5975</lpage>. <pub-id pub-id-type="doi">10.1128/JB.00352-09</pub-id>
</citation>
</ref>
<ref id="B65">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Song</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Shoemaker</surname>
<given-names>N. B.</given-names>
</name>
<name>
<surname>Gardner</surname>
<given-names>J. F.</given-names>
</name>
<name>
<surname>Salyers</surname>
<given-names>A. A.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>Integration site selection by the Bacteroides conjugative transposon CTnBST</article-title>. <source>J. Bacteriol.</source> <volume>189</volume> (<issue>18</issue>), <fpage>6594</fpage>&#x2013;<lpage>6601</lpage>. <pub-id pub-id-type="doi">10.1128/JB.00668-07</pub-id>
</citation>
</ref>
<ref id="B66">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Springael</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Kreps</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Mergeay</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>1993</year>). <article-title>Identification of a catabolic transposon, Tn4371, carrying biphenyl and 4-chlorobiphenyl degradation genes in Alcaligenes eutrophus A5</article-title>. <source>J. Bacteriol.</source> <volume>175</volume> (<issue>6</issue>), <fpage>1674</fpage>&#x2013;<lpage>1681</lpage>. <pub-id pub-id-type="doi">10.1128/jb.175.6.1674-1681.1993</pub-id>
</citation>
</ref>
<ref id="B67">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Street</surname>
<given-names>L. M.</given-names>
</name>
<name>
<surname>Harley</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Stern</surname>
<given-names>J. C.</given-names>
</name>
<name>
<surname>Larkin</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Williams</surname>
<given-names>S. L.</given-names>
</name>
<name>
<surname>Miller</surname>
<given-names>D. L.</given-names>
</name>
<etal/>
</person-group> (<year>2003</year>). <article-title>Subdomain organization and catalytic residues of the F factor TraI relaxase domain</article-title>. <source>Biochim. Biophys. Acta</source> <volume>1646</volume> (<issue>1-2</issue>), <fpage>86</fpage>&#x2013;<lpage>99</lpage>. <pub-id pub-id-type="doi">10.1016/s1570-9639(02)00553-8</pub-id>
</citation>
</ref>
<ref id="B68">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Su</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Clewell</surname>
<given-names>D. B.</given-names>
</name>
</person-group> (<year>1992</year>). <article-title>Characterization of the tet (M) determinant of Tn916: Evidence for regulation by transcription attenuation</article-title>. <source>Antimicrob. Agents Chemother.</source> <volume>36</volume> (<issue>4</issue>), <fpage>769</fpage>&#x2013;<lpage>778</lpage>. <pub-id pub-id-type="doi">10.1128/aac.36.4.769</pub-id>
</citation>
</ref>
<ref id="B69">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sugawara</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Shumway</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>The sequence read archive</article-title>. <source>Nucleic Acids Res.</source> <volume>39</volume> (<issue>1</issue>), <fpage>D19</fpage>&#x2013;<lpage>D21</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkq1019</pub-id>
</citation>
</ref>
<ref id="B70">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Uhlemann</surname>
<given-names>A. C. L.</given-names>
</name>
<name>
<surname>Aj Prensky</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Gomez-Simmonds</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Conjugation dynamics depend on both the plasmid acquisition cost and the fitness cost</article-title>. <source>Mol. Syst. Biol.</source> <volume>17</volume>, <fpage>e9913</fpage>. <pub-id pub-id-type="doi">10.15252/msb.20209913</pub-id>
</citation>
</ref>
<ref id="B71">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Waldor</surname>
<given-names>M. K.</given-names>
</name>
<name>
<surname>Beaber</surname>
<given-names>J. W.</given-names>
</name>
<name>
<surname>Hochhut</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>SOS response promotes horizontal dissemination of antibiotic resistance genes</article-title>. <source>Nature</source> <volume>427</volume>, <fpage>72</fpage>&#x2013;<lpage>74</lpage>. <pub-id pub-id-type="doi">10.1038/nature02241</pub-id>
</citation>
</ref>
<ref id="B72">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>van Dorp</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Shaw</surname>
<given-names>L. P.</given-names>
</name>
<name>
<surname>Bradley</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>X.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>The global distribution and spread of the mobilized colistin resistance gene mcr-1</article-title>. <source>Nat. Commun.</source> <volume>9</volume> (<issue>1</issue>), <fpage>1179</fpage>&#x2013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1038/s41467-018-03205-z</pub-id>
</citation>
</ref>
<ref id="B73">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Waskom</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Botvinnik</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Hobson</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Warmenhoven</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Cole</surname>
<given-names>J. B.</given-names>
</name>
<name>
<surname>Halchenko</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Seaborn: V0. 6.0 (June 2015)</article-title>. <source>Zenodo</source>. <pub-id pub-id-type="doi">10.5281/zenodo.19108</pub-id>
</citation>
</ref>
<ref id="B74">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wiedenbeck</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Cohan</surname>
<given-names>F. M.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Origins of bacterial diversity through horizontal genetic transfer and adaptation to new ecological niches</article-title>. <source>FEMS Microbiol. Rev.</source> <volume>35</volume> (<issue>5</issue>), <fpage>957</fpage>&#x2013;<lpage>976</lpage>. <pub-id pub-id-type="doi">10.1111/j.1574-6976.2011.00292.x</pub-id>
</citation>
</ref>
<ref id="B75">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wozniak</surname>
<given-names>R. A. F.</given-names>
</name>
<name>
<surname>Waldor</surname>
<given-names>M. K.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Integrative and conjugative elements: Mosaic mobile genetic elements enabling dynamic lateral gene flow</article-title>. <source>Nat. Rev. Microbiol.</source> <volume>8</volume> (<issue>8</issue>), <fpage>552</fpage>&#x2013;<lpage>563</lpage>. <pub-id pub-id-type="doi">10.1038/nrmicro2382</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>