<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Microbiol.</journal-id>
<journal-title>Frontiers in Microbiology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Microbiol.</abbrev-journal-title>
<issn pub-type="epub">1664-302X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fmicb.2022.923105</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Microbiology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Homology-based reconstruction of regulatory networks for bacterial and archaeal genomes</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author"><name><surname>Romero</surname><given-names>Luis</given-names></name>
<xref ref-type="author-notes" rid="fn012"><sup>&#x02020;</sup></xref>
<xref rid="aff1" ref-type="aff"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author"><name><surname>Contreras-Riquelme</surname><given-names>Sebastian</given-names></name>
<xref ref-type="author-notes" rid="fn013"><sup>&#x02020;</sup></xref>
<xref rid="aff2" ref-type="aff"><sup>2</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/735594/overview"/>
</contrib>
<contrib contrib-type="author"><name><surname>Lira</surname><given-names>Manuel</given-names></name>
<xref rid="aff3" ref-type="aff"><sup>3</sup></xref>
</contrib>
<contrib contrib-type="author" corresp="yes"><name><surname>Martin</surname><given-names>Alberto J. M.</given-names></name>
<xref ref-type="author-notes" rid="fn014"><sup>&#x02020;</sup></xref>
<xref rid="aff2" ref-type="aff"><sup>2</sup></xref>
<xref rid="c002" ref-type="corresp"><sup>&#x002A;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/592883/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes"><name><surname>Perez-Rueda</surname><given-names>Ernesto</given-names></name>
<xref rid="aff4" ref-type="aff"><sup>4</sup></xref>
<xref rid="c001" ref-type="corresp"><sup>&#x002A;</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/681131/overview"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Licenciatura en Ciencias Genomicas, Universidad Nacional Autonoma de Mexico</institution>, <addr-line>Cuernavaca</addr-line>, <country>Mexico</country></aff>
<aff id="aff2"><sup>2</sup><institution>Laboratorio de Biolog&#x00ED;a de Redes, Centro de Gen&#x00F3;mica y Bioinform&#x00E1;tica, Facultad Ciencias, Ingenier&#x00ED;a y Tecnolog&#x00ED;a, Universidad Mayor</institution>, <addr-line>Santiago</addr-line>, <country>Chile</country></aff>
<aff id="aff3"><sup>3</sup><institution>C&#x00F3;mputo Acad&#x00E9;mico, Facultad de Ciencias - UMDI-Sisal, Sede Parque Cient&#x00ED;fico y Tecnol&#x00F3;gico de Yucat&#x00E1;n, Universidad Nacional Aut&#x00F3;noma de M&#x00E9;xico</institution>, <addr-line>M&#x00E9;rida</addr-line>, <country>Mexico</country></aff>
<aff id="aff4"><sup>4</sup><institution>Instituto de Investigaciones en Matem&#x00E1;ticas Aplicadas y en Sistemas, Universidad Nacional Aut&#x00F3;noma de M&#x00E9;xico, Unidad Acad&#x00E9;mica Yucat&#x00E1;n</institution>, <addr-line>M&#x00E9;rida</addr-line>, <country>Mexico</country></aff>
<author-notes>
<fn id="fn0001" fn-type="edited-by">
<p>Edited by: Emilio M. Ungerfeld, Instituto de Investigaciones Agropecuarias, Chile</p>
</fn>
<fn id="fn0002" fn-type="edited-by">
<p>Reviewed by: Ilya R. Akberdin, Biosoft.ru, Russia; Shogo Ozaki, Kyushu University, Japan; Matthew Shepherd, University of Bath, United Kingdom</p>
</fn>
<corresp id="c001">&#x002A;Correspondence: Ernesto Perez-Rueda, <email>ernesto.perez@iimas.unam.mx</email></corresp>
<corresp id="c002">Alberto J. M. Martin, <email>alberto.martin@umayor.cl</email></corresp>
<fn fn-type="equal" id="fn012"><p>&#x02020;ORCID: Luis Romero, <ext-link ext-link-type="uri" xlink:href="https://orcid.org/0000-0003-2102-5373">https://orcid.org/0000-0003-2102-5373</ext-link></p></fn>
<fn fn-type="equal" id="fn013"><p>Sebastian Contreras-Riquelme, <ext-link ext-link-type="uri" xlink:href="https://orcid.org/0000-0002-4384-3580">https://orcid.org/0000-0002-4384-3580</ext-link></p></fn>
<fn fn-type="equal" id="fn014"><p>Alberto J. M. Martin, <ext-link ext-link-type="uri" xlink:href="https://orcid.org/0000-0002-6147-3325">https://orcid.org/0000-0002-6147-3325</ext-link></p></fn>
<fn id="fn0003" fn-type="other">
<p>This article was submitted to Systems Microbiology, a section of the journal Frontiers in Microbiology</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>19</day>
<month>07</month>
<year>2022</year>
</pub-date>
<pub-date pub-type="collection">
<year>2022</year>
</pub-date>
<volume>13</volume>
<elocation-id>923105</elocation-id>
<history>
<date date-type="received">
<day>18</day>
<month>04</month>
<year>2022</year>
</date>
<date date-type="accepted">
<day>27</day>
<month>06</month>
<year>2022</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2022 Romero, Contreras-Riquelme, Lira, Martin and Perez-Rueda.</copyright-statement>
<copyright-year>2022</copyright-year>
<copyright-holder>Romero, Contreras-Riquelme, Lira, Martin and Perez-Rueda</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Gene regulation is a key process for all microorganisms, as it allows them to adapt to different environmental stimuli. However, despite the relevance of gene expression control, for only a handful of organisms is there related information about genome regulation. In this work, we inferred the gene regulatory networks (GRNs) of bacterial and archaeal genomes by comparisons with six organisms with well-known regulatory interactions. The references we used are: <italic>Escherichia coli</italic> K-12 MG1655, <italic>Bacillus subtilis</italic> 168, <italic>Mycobacterium tuberculosis</italic>, <italic>Pseudomonas aeruginosa</italic> PAO1, <italic>Salmonella enterica</italic> subsp. <italic>enterica</italic> serovar <italic>typhimurium</italic> LT2, and <italic>Staphylococcus aureus</italic> N315. To this end, the inferences were achieved in two steps. First, the six model organisms were contrasted in an all-<italic>vs</italic>-all comparison of known interactions based on Transcription Factor (TF)-Target Gene (TG) orthology relationships and Transcription Unit (TU) assignments. In the second step, we used a guilt-by-association approach to infer the GRNs for 12,230 bacterial and 649 archaeal genomes based on TF-TG orthology relationships of the six bacterial models determined in the first step. Finally, we discuss examples to show the most relevant results obtained from these inferences. A web server with all the predicted GRNs is available at <ext-link ext-link-type="uri" xlink:href="https://regulatorynetworks.unam.mx/">https://regulatorynetworks.unam.mx/</ext-link> or <ext-link ext-link-type="uri" xlink:href="http://132.247.46.6/">http://132.247.46.6/</ext-link>.</p>
</abstract>
<kwd-group>
<kwd>regulatory networks</kwd>
<kwd>orthology</kwd>
<kwd>transcription units</kwd>
<kwd>regulatory modules</kwd>
<kwd>genomics</kwd>
</kwd-group>
<contract-num rid="cn1">IN-209620</contract-num>
<contract-num rid="cn2">320012</contract-num>
<contract-sponsor id="cn1">Universidad Nacional Aut&#x00F3;noma de M&#x00E9;xico<named-content content-type="fundref-id">10.13039/501100005739</named-content></contract-sponsor>
<contract-sponsor id="cn2">CONACYT</contract-sponsor>
<counts>
<fig-count count="2"/>
<table-count count="4"/>
<equation-count count="3"/>
<ref-count count="48"/>
<page-count count="9"/>
<word-count count="6706"/>
</counts>
</article-meta>
</front>
<body>
<sec id="sec1" sec-type="intro">
<title>Introduction</title>
<p>Bacterial and archaeal organisms respond to diverse stimuli <italic>via</italic> the subtle mechanism of regulation of gene expression at the transcriptional level, and this involves DNA-binding proteins known as transcription factors (TFs). These proteins act by interacting with specific sites, usually upstream of the transcription start site, inducing or blocking access of the RNA polymerase to the promoter. In general, when a TF binds at a site that overlaps the promoter region of a gene, the system is repressed; when the binding site is upstream of the promoter, the system is activated (<xref ref-type="bibr" rid="ref4">Browning and Busby, 2016</xref>). In addition, this regulatory system is coordinated with the sensing of endogenous or exogenous stimuli by these regulatory proteins, i.e., they have the ability to sense diverse conditions for the cell to contend against environmental changes. For instance, in the bacterium <italic>Escherichia coli</italic> K-12, approximately three-quarters of TFs respond directly to extracellular signals through phosphorylation and binding to small molecules, such as allolactose or maltose (<xref ref-type="bibr" rid="ref1">Balderas-Mart&#x00ED;nez et al., 2013</xref>).</p>
<p>In this context, the regulatory system can be conceptualized as a circuit, where one TF can regulate multiple Target Genes (TGs) and multiple genes can be regulated by one or diverse TFs, all of them assembled into a gene regulatory network (GRN). In GRNs, nodes represent genes and the connections between them indicate that the TF-encoding gene regulates another gene; this type of network can be represented by directed graphs (<xref ref-type="bibr" rid="ref17">Karlebach and Shamir, 2008</xref>).</p>
<p>To date, GRNs have been determined for only a few bacterial models from three different phyla: Proteobacteria, including <italic>Escherichia coli</italic> K-12, <italic>Salmonella enterica</italic> subsp. <italic>enterica</italic> serovar <italic>typhimurium</italic> LT2, and <italic>Pseudomonas aeruginosa</italic> PAO1; Firmicutes, including <italic>Bacillus subtilis</italic> 168 and <italic>Staphylococcus aureus</italic> N315; and Actinobacteria, including <italic>Mycobacterium tuberculosis</italic>. The lack of GRNs for most microorganisms is due to the fact that reconstruction depends largely on experimental data. Therefore, the inference or expansion of regulatory relationships between TFs and their TGs in organisms beyond the bacterial models will allow us to understand diverse biological processes, such as cell growth, response to environmental changes, or cell division, among others.</p>
<p>In this regard, various approaches have been explored to reconstruct regulatory networks in bacteria, such as RegPrecise (<xref ref-type="bibr" rid="ref29">Novichkov et al., 2010</xref>), with a large amount of information available for regulons of diverse organisms, or the work of <xref ref-type="bibr" rid="ref5">Castro-Melchor et al. (2010)</xref> based on the transcript and functional similarities to infer regulatory networks in <italic>Streptomyces coelicolor</italic>, among others. However, the main limitations of these reconstructions are associated with the experimental information data.</p>
<p>Hence, to determine the GRNs in bacterial and archaeal genomes with no information on their regulatory interactions, we mapped orthologous interactions among the six bacterial models to identify novel TF-TG interactions. Next, we used a guilt-by-association approach to infer the GRNs for 12,230 bacterial and 649 archaeal genomes, based on TF-TG orthology relationships of six bacterial species with well-known regulatory interactions and Transcription Unit (TU) assignments (i.e., operonic organization). The &#x201C;guilt-by-association&#x201D; principle has been applied to deduce functional relationships (<xref ref-type="bibr" rid="ref30">Oliver, 2000</xref>), and used to predict gene function in various types of biological networks, for example in virulence factors of the bacterial pathogen, <italic>Aeromonas veronii</italic> (<xref ref-type="bibr" rid="ref21">Li et al., 2021</xref>). The reconstructed networks were evaluated in terms of their topological properties, identifying TFs as hubs, modules, and co-regulated genes. Thus, our approach allowed us to confer a degree of accuracy regarding the existence of each inferred interaction. Therefore, the predicted interactions must be considered as a starting point for further exploration, both <italic>in silico</italic> and experimentally. We suggest that subsequent analyses must consider the identification of DNA-binding sites upstream of the probably regulated gene or a functional analysis with Gene Ontology and global expression profiles, as has already been suggested in other cellular systems beyond bacteria and archaea (<xref ref-type="bibr" rid="ref6">Chen, 2017</xref>). Finally, a web server with all the predicted GRNs is available to the scientific community at <ext-link xlink:href="https://regulatorynetworks.unam.mx/" ext-link-type="uri">https://regulatorynetworks.unam.mx/</ext-link> or <ext-link xlink:href="http://132.247.46.6/" ext-link-type="uri">http://132.247.46.6/</ext-link>.</p>
</sec>
<sec id="sec2">
<title>Data and methodology</title>
<sec id="sec3">
<title>Genomes used for reference</title>
<p>The information for six bacterial genomes used in this work was downloaded from either the NCBI server or RegulonDB: <italic>E. coli</italic> K-12 MG1655 (NC_000913.3, GCF_000005845.2), <italic>B. subtilis</italic> 168 (GCF_000009045.1), <italic>P. aeruginosa</italic> PAO1 (GCF_000006765.1), <italic>S. typhimurium</italic> LT2 (GCF_000006945.2), <italic>S. aureus</italic> N315 (GCF_000009645.1), and <italic>M. tuberculosis</italic> (GCF_000195955.2). For each genome, the FASTA sequence was obtained from the &#x201C;gbff/gbk&#x201D; files parsed with an <italic>ad hoc</italic> program (<xref ref-type="supplementary-material" rid="SM1">Supplementary material</xref>, ParserGBK.py), to add the appropriate label in the header: NCBI gene ID, local gene ID, gene name, product description, and organism name. Sequences with missing information were annotated as &#x201C;NODATA.&#x201D; In addition, the 12,230 genomes of bacteria and 649 archaeal genomes were downloaded from the NCBI RefSeq genome database on May 18, 2021, to infer their GRNs.</p>
</sec>
<sec id="sec4">
<title>Gene regulatory interactions</title>
<p>The regulatory interactions were obtained from specialized databases [DBTBS for <italic>B. subtilis</italic> release 5 (<xref ref-type="bibr" rid="ref42">Sierro et al., 2008</xref>),<xref rid="fn0004" ref-type="fn"><sup>1</sup></xref> RegulonDB release 10.9 for <italic>E. coli</italic> (<xref ref-type="bibr" rid="ref37">Santos-Zavaleta et al., 2019a</xref>),<xref rid="fn0005" ref-type="fn"><sup>2</sup></xref> <italic>M. tuberculosis</italic> (<xref ref-type="bibr" rid="ref16">Kapopoulou et al., 2011</xref>; <xref ref-type="bibr" rid="ref39">Sanz et al., 2011</xref>), RegulomePA release 1.0 for <italic>P. aeruginosa</italic>,<xref rid="fn0006" ref-type="fn"><sup>3</sup></xref> SalmoNet release 2.0 for <italic>S. typhimurium</italic> LT2 (<xref ref-type="bibr" rid="ref25">M&#x00E9;tris et al., 2017</xref>), and for <italic>S. aureus</italic> N315 (<xref ref-type="bibr" rid="ref36">Ravcheev et al., 2011</xref>; <xref ref-type="bibr" rid="ref35">Poudel et al., 2020</xref>)] and subsequently homogenized to follow the same format: the first column corresponds to the number assigned to each regulatory interaction per organism; the second column, the associated TF; the third column, the target gene; and the other columns indicate the annotations derived from the original networks (<xref ref-type="supplementary-material" rid="SM1">Supplementary material</xref>). These GRNs are summarized in <xref rid="tab1" ref-type="table">Table 1</xref>.</p>
<table-wrap position="float" id="tab1">
<label>Table 1</label>
<caption>
<p>Total new interactions per organism.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="middle">Contribution source &#x2192;</th>
<th align="center" valign="middle" rowspan="2"><italic>B. subtilis 168</italic></th>
<th align="center" valign="middle" rowspan="2"><italic>E. coli K-12</italic></th>
<th align="center" valign="middle" rowspan="2"><italic>P. aeruginosa PAO1</italic></th>
<th align="center" valign="middle" rowspan="2"><italic>S. typhimurium LT2</italic></th>
<th align="center" valign="middle" rowspan="2"><italic>S. aureus N315</italic></th>
<th align="center" valign="middle" rowspan="2"><italic>M. tuberculosis H37Rv</italic></th>
<th align="center" valign="middle" rowspan="2">TUs</th>
<th align="center" valign="middle" rowspan="2">New interactions</th>
</tr>
<tr>
<th align="left" valign="middle">Network contributed &#x2193;</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top"><italic>B. subtilis 168</italic> (2738)</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">395<break/>(21.69%)</td>
<td align="center" valign="top">34<break/>(1.86%)</td>
<td align="center" valign="top">255<break/>(14.00%)</td>
<td align="center" valign="top">206<break/>(11.31%)</td>
<td align="center" valign="top">286 (15.70%)</td>
<td align="center" valign="top">828<break/>(45.46%)</td>
<td align="center" valign="top">1,821</td>
</tr>
<tr>
<td align="left" valign="top"><italic>E. coli K-12</italic> (3616)</td>
<td align="center" valign="top">248<break/>(14.79%)</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">157<break/>(9.36%)</td>
<td align="center" valign="top">600<break/>(35.79%)</td>
<td align="center" valign="top">125<break/>(7.45%)</td>
<td align="center" valign="top">193 (11.51%)</td>
<td align="center" valign="top">393<break/>(23.62%)</td>
<td align="center" valign="top">1,676</td>
</tr>
<tr>
<td align="left" valign="top"><italic>P. aeruginosa PAO1</italic> (998)</td>
<td align="center" valign="top">139<break/>(5.56%)</td>
<td align="center" valign="top">1,117 (44.69%)</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">709<break/>(28.37%)</td>
<td align="center" valign="top">92<break/>(3.68%)</td>
<td align="center" valign="top">331 (13.24%)</td>
<td align="center" valign="top">679<break/>(27.17%)</td>
<td align="center" valign="top">2,499</td>
</tr>
<tr>
<td align="left" valign="top"><italic>S. typhimurium LT2</italic> (2969)</td>
<td align="center" valign="top">259<break/>(10.71%)</td>
<td align="center" valign="top">1,135 (46.95%)</td>
<td align="center" valign="top">140<break/>(5.79%)</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">124<break/>(5.13%)</td>
<td align="center" valign="top">238 (9.84%)</td>
<td align="center" valign="top">608<break/>(25.15%)</td>
<td align="center" valign="top">2,417</td>
</tr>
<tr>
<td align="left" valign="top"><italic>S. aureus N315</italic> (709)</td>
<td align="center" valign="top">355<break/>(43.88%)</td>
<td align="center" valign="top">173 (21.38%)</td>
<td align="center" valign="top">8<break/>(0.98%)</td>
<td align="center" valign="top">109<break/>(13.47%)</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">79<break/>(9.76%)</td>
<td align="center" valign="top">177<break/>(21.87%)</td>
<td align="center" valign="top">809</td>
</tr>
<tr>
<td align="left" valign="top"><italic>M. tuberculosis H37Rv</italic> (2637)</td>
<td align="center" valign="top">70<break/>(9.02%)</td>
<td align="center" valign="top">242 (31.18%)</td>
<td align="center" valign="top">17<break/>(2.19%)</td>
<td align="center" valign="top">140<break/>(18.04%)</td>
<td align="center" valign="top">22<break/>(2.83%)</td>
<td align="center" valign="top">&#x2013;</td>
<td align="center" valign="top">405<break/>(52.19%)</td>
<td align="center" valign="top">776</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>The number of interactions, the contribution percentage of each organism (row &#x201C;contribution&#x201D;) to the new interactions, and the extension by TU assignment are indicated. The number of interactions in the original network is indicated in brackets (first column).</p>
</table-wrap-foot>
</table-wrap>
</sec>
<sec id="sec5">
<title>Ortholog identification</title>
<p>The protein sequences from each model organism were used as reference to identify the orthologs in an all-<italic>vs</italic>-all genomes fashion using the program Proteinortho (<xref ref-type="bibr" rid="ref19">Lechner et al., 2011</xref>) with the following parameters: E-value &#x2264;10<sup>&#x2212;5</sup>, coverage &#x2265;70%, and identity of &#x2265;25%, as previously described for the identification of TFs (<xref ref-type="bibr" rid="ref9">Flores-Bautista et al., 2020</xref>).</p>
</sec>
<sec id="sec6">
<title>Transcription units</title>
<p>The predictions of Transcription Units (TUs) or operons were obtained using the method described by <xref ref-type="bibr" rid="ref28">Moreno-Hagelsieb and Collado-Vides (2002)</xref>. In brief, the predictions were based on the transcription direction and the intergenic distance (shorter intergenic distances and in the same direction for genes in the same TU).</p>
</sec>
<sec id="sec7">
<title>Inference of GRNs</title>
<p>The reference genomes were used to scan the 12,230 bacterial and 649 archaeal genomes to identify their orthologs and map their interactions considering the following criteria: If the orthologs of the TF and its TG of the model organism were found in a new genome, the interaction was assigned using guilt by association. In a second step, predicted TUs were used to expand the TF-TG interactions as follows: If the orthologous TG in an organism corresponded to the first gene in the TU, the other genes belonging to the TU were associated with the same TF. Finally, each network was integrated using all the ortholog assignments with the six reference GRNs. All the network interactions can be inferred by running the script <italic>pipeline.sh</italic>, provided as <xref ref-type="supplementary-material" rid="SM1">Supplementary material</xref>; the workflow is outlined in <xref rid="fig1" ref-type="fig">Figure 1</xref>.</p>
<fig position="float" id="fig1">
<label>Figure 1</label>
<caption>
<p>Flow diagram showing the inference of the GRNs. Six bacterial models were used to infer the GRNs in 12,230 bacterial and 649 archaeal genomes. If the pair A (TF) &#x2013; B (TG) in a reference genome is identified (by orthology) in a new genome A&#x2032; (TF) &#x2013; B&#x2032; (TG), the interaction is assigned. In addition, if the TG identified in the new genome is the first one in the TU, the interaction is extended to the other gene(s). One interaction in a new genome can be derived from one or more bacterial models. Finally, the reconstructed networks were evaluated in terms of their topological properties.</p>
</caption>
<graphic xlink:href="fmicb-13-923105-g001.tif"/>
</fig>
</sec>
<sec id="sec8">
<title>Regulatory modules</title>
<p>The GRNs were analyzed by using Cytoscape (<xref ref-type="bibr" rid="ref41">Shannon et al., 2003</xref>; <xref ref-type="bibr" rid="ref31">Otasek et al., 2019</xref>) to obtain their degree, clustering coefficient, and other centrality metrics. Hubs were obtained by using the NetworkX library for Python (<xref ref-type="bibr" rid="ref14">Hagberg et al., 2008</xref>). In addition, to identify transcriptional co-regulators and modules in a GRN, the CoReg software was used. In brief, CoReg calculates gene similarities based on the number of common neighbors of any two genes in the network (<xref ref-type="bibr" rid="ref44">Song et al., 2017</xref>).</p>
</sec>
<sec id="sec9">
<title>Web server</title>
<p>The GRNs inferred for all the bacterial and archaeal genomes are available through the web server at <ext-link xlink:href="https://regulatorynetworks.unam.mx/" ext-link-type="uri">https://regulatorynetworks.unam.mx/</ext-link>, which is built on HTML5, jQuery, and PHP, while the data are stored in a MySQL database. For the data display, we use the Cytoscape JS (<xref ref-type="bibr" rid="ref10">Franz et al., 2016</xref>) framework due to its capabilities to represent nodes and edges of the network with determined properties, allowing users to change forms, colors, and layer visualization of the network.</p>
</sec>
<sec id="sec10">
<title>Method performance and statistical analysis</title>
<p>GRNs were compared using two different approaches to establish the reliability of the approach, one based on the ability to recover edges and the second focusing on the ability to recover network motifs (<xref ref-type="bibr" rid="ref26">Milo et al., 2002</xref>) by comparing the six reference networks with networks for the same genomes generated using our approach.</p>
<p>First, based on the orthologous annotations made with Proteinortho, we created a GRN for each of the reference bacteria using a naming convention that ensures that genes that are orthologous among them share the same name in each of the six GRNs used as reference. Then, we created networks for each reference organism based on the regulations transferred from the other five GRNs, again using the consensus gene names. GRNs with consensus gene names were then compared, following two procedures implemented in LoTo (<xref ref-type="bibr" rid="ref22">Martin et al., 2017</xref>). We employed binary classification metrics to evaluate the similarities between pairs of GRNs as follows: Edges present in both compared networks are considered true positives (TPs); edges present in only one of the networks are false negatives (FNs) if they are only in the reference network and false positives (FPs) if they appear only in the network we compared with the reference; and true negatives (TNs) are the edges absent in both compared networks. This edge-based approach is used to compare predicted GRNs versus reference networks, and it indicates overall network similarity (<xref ref-type="bibr" rid="ref46">The DREAM5 Consortium et al., 2012</xref>). The second approach relies on the presence or absence of the motifs defined by <xref ref-type="bibr" rid="ref26">Milo et al. (2002)</xref> that have been related to functional patterns in GRNs. Instead of considering TF-gene interactions, in this second approach, we considered motifs present in both compared networks as TPs, motifs found only in the reference network as FNs, and motifs present only in the network compared against the reference GRN as FPs.</p>
<p>LoTo calculates several metrics, but here we only focused on the most employed ones:</p>
<disp-formula id="E1">
<mml:math id="M1">
<mml:mrow>
<mml:mi mathvariant="normal">Precision</mml:mi>
<mml:mspace width="thickmathspace"/>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi mathvariant="normal">P</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>=</mml:mo>
<mml:mi mathvariant="normal">TP</mml:mi>
<mml:mo>/</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi mathvariant="normal">TP</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi mathvariant="normal">FP</mml:mi>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="E2">
<mml:math id="M2">
<mml:mrow>
<mml:mi mathvariant="normal">Recall</mml:mi>
<mml:mspace width="thickmathspace"/>
<mml:mfenced>
<mml:mi mathvariant="normal">R</mml:mi>
</mml:mfenced>
<mml:mo>=</mml:mo>
<mml:mi mathvariant="normal">TP</mml:mi>
<mml:mo>/</mml:mo>
<mml:mfenced>
<mml:mrow>
<mml:mi mathvariant="normal">TP</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi mathvariant="normal">FN</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:math>
</disp-formula>
<p>and</p>
<disp-formula id="E3">
<mml:math id="M3">
<mml:mrow>
<mml:mi mathvariant="normal">F1</mml:mi>
<mml:mo>=</mml:mo>
<mml:mi mathvariant="normal">2PR</mml:mi>
<mml:mo>/</mml:mo>
<mml:mfenced>
<mml:mrow>
<mml:mi mathvariant="normal">P</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi mathvariant="normal">R</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:math>
</disp-formula>
<p>To establish a baseline and determine whether the results from our approach are significant versus what can be expected by chance, we also created a protocol to determine the expectancy of a transferred TF-gene regulation by chance. We randomized the names of the TFs for the whole inferred networks 10,000 times to calculate expected TP, FP, TN, and FN values by comparing these randomized networks against their reference counterparts. This protocol ensures comparisons of random networks with the same characteristics, e.g., edges, TFs, and genes, against their actual reference. We then employed a G-test as implemented in SciPy (<xref ref-type="bibr" rid="ref47">Virtanen et al., 2020</xref>) to determine whether the observed number of edges considered TP, FP, TN, and FN can be from the same distribution as that observed for the predicted networks without randomization.</p>
</sec>
</sec>
<sec id="sec11">
<title>Results and discussion</title>
<sec id="sec12">
<title>Identification of new interactions in bacterial models</title>
<p>In order to evaluate and expand the GRNs of the six model organisms, the number of TFs, TGs, and their interactions was determined. To do this, we downloaded six GRNs, and their interactions were displayed by using Cytoscape. In this work, we considered TFs as those proteins that activate or repress gene expression but do not belong to the transcriptional basal machinery; therefore, sigma factors, antiterminators, terminators, and sensor proteins, among other proteins, were excluded from the resulting data set (<xref ref-type="bibr" rid="ref23">Mart&#x00ED;nez-N&#x00FA;&#x00F1;ez et al., 2013</xref>). <xref rid="tab2" ref-type="table">Table 2</xref> shows the number of interactions associated with each organism. The most studied bacterial species, <italic>E. coli</italic> K-12, has 3,616 interactions based on experimental evidence, followed by <italic>S. typhimurium</italic> LT2 (2,969 interactions) and <italic>B. subtilis</italic> with 2,738 TF-TG interactions, whereas the GRN of <italic>S. aureus</italic> contains the smallest number of interactions, with 709. This difference could be a consequence of the experimental evidence accumulated over the years and the number of experiments carried out with each organism; i.e., there is a bias inherent to the experimental analysis towards specific organisms. For instance, in a recent collection of 668 experimentally characterized TFs in bacterial and archaeal organisms (<xref ref-type="bibr" rid="ref9">Flores-Bautista et al., 2020</xref>), 33.5% was associated with <italic>E. coli</italic> K-12, 23% with different strains of <italic>M. tuberculosis</italic>, and 19% with <italic>B. subtilis</italic> 168; i.e., 76% of the complete collection is concentrated in few organisms; in contrast, 24% of the collection is distributed among 78 different prokaryotes. This contrast in the information is also evident in more general databases, such as UniProtKB/Swiss-Prot, where <italic>E. coli</italic> K-12 is the bacterial organism with the most proteins deposited and curated manually in the database.<xref rid="fn0007" ref-type="fn"><sup>4</sup></xref></p>
<table-wrap position="float" id="tab2">
<label>Table 2</label>
<caption>
<p>Single edge comparisons between the six reference networks employed in this work and their counterparts generated following our homology-based transfer approach from the other remaining networks.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Organism</th>
<th align="center" valign="top">TP</th>
<th align="center" valign="top">FP</th>
<th align="center" valign="top">FN</th>
<th align="center" valign="top"><italic>R</italic></th>
<th align="center" valign="top"><italic>P</italic></th>
<th align="center" valign="top"><italic>F</italic>1</th>
<th align="center" valign="top"><italic>p</italic>-value</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top"><italic>B. subtilis 168</italic></td>
<td align="center" valign="top">254</td>
<td align="center" valign="top">499</td>
<td align="center" valign="top">2,447</td>
<td align="char" valign="top" char=".">0.094</td>
<td align="char" valign="top" char=".">0.3373</td>
<td align="char" valign="top" char=".">0.147</td>
<td align="char" valign="top" char=".">4.01e&#x2013;258</td>
</tr>
<tr>
<td align="left" valign="top"><italic>E. coli K-12</italic></td>
<td align="center" valign="top">1,538</td>
<td align="center" valign="top">709</td>
<td align="center" valign="top">1,971</td>
<td align="char" valign="top" char=".">0.4383</td>
<td align="char" valign="top" char=".">0.6845</td>
<td align="char" valign="top" char=".">0.5344</td>
<td align="char" valign="top" char=".">0.0</td>
</tr>
<tr>
<td align="left" valign="top"><italic>P. aeruginosa PAO1</italic></td>
<td align="center" valign="top">51</td>
<td align="center" valign="top">202</td>
<td align="center" valign="top">938</td>
<td align="char" valign="top" char=".">0.0516</td>
<td align="char" valign="top" char=".">0.2016</td>
<td align="char" valign="top" char=".">0.0822</td>
<td align="char" valign="top" char=".">9.46e&#x2013;39</td>
</tr>
<tr>
<td align="left" valign="top"><italic>S. typhimurium LT2</italic></td>
<td align="center" valign="top">1,491</td>
<td align="center" valign="top">666</td>
<td align="center" valign="top">1,394</td>
<td align="char" valign="top" char=".">0.5168</td>
<td align="char" valign="top" char=".">0.6912</td>
<td align="char" valign="top" char=".">0.5914</td>
<td align="char" valign="top" char=".">0.0</td>
</tr>
<tr>
<td align="left" valign="top"><italic>S. aureus N315</italic></td>
<td align="center" valign="top">229</td>
<td align="center" valign="top">237</td>
<td align="center" valign="top">466</td>
<td align="char" valign="top" char=".">0.3295</td>
<td align="char" valign="top" char=".">0.4914</td>
<td align="char" valign="top" char=".">0.3945</td>
<td align="char" valign="top" char=".">9.45e&#x2013;229</td>
</tr>
<tr>
<td align="left" valign="top"><italic>M. tuberculosis H37Rv</italic></td>
<td align="center" valign="top">71</td>
<td align="center" valign="top">138</td>
<td align="center" valign="top">2,494</td>
<td align="char" valign="top" char=".">0.0277</td>
<td align="char" valign="top" char=".">0.3397</td>
<td align="char" valign="top" char=".">0.0512</td>
<td align="char" valign="top" char=".">5.99e&#x2013;52</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>Precision (P), Recall (R), and F1 were calculated using the true positive (TP), false positive (FP), and false negative edges (FN). P-value of the G-test indicates the significance of the differences between the averaged counts of TP, FP, TN, and FN in the 10,000 randomizations of the inferred networks and the results shown in the table.</p>
</table-wrap-foot>
</table-wrap>
<p>To determine the number of interactions shared among the six model organisms, we first used the program Proteinortho to assign orthology relationships between all proteins in the proteome of each bacterium. Once orthologous proteins were determined, we inferred regulatory interactions between organisms based on the presence of an orthologous TF and an orthologous target of that TF in the model GRN. In the second step, the interactions were expanded by using the TU assignments, as described in Materials and Methods. This comparison showed that <italic>E. coli</italic> and <italic>S. typhimurium</italic> LT2 share a high number of interactions, because of their phylogenetic closeness. In contrast, the actinobacterium <italic>M. tuberculosis</italic> is the organism with the lowest number of shared interactions with the other bacterial models as a consequence of its phylogenetic distance; only 12% (on average) of its interactions are shared with other bacteria (see <xref ref-type="supplementary-material" rid="SM1">Supplementary material</xref>).</p>
<p>In order to infer new interactions among the six bacterial genomes, they were compared and their interactions were assigned based on the presence of the TF-TG orthologous pairs. In this regard, <xref rid="tab1" ref-type="table">Table 1</xref> shows the number of new assignments and their proportion per organism. From this analysis, we found between 776 and 2,499 new interactions, with <italic>S. typhimurium</italic> LT2 and <italic>P. aeruginosa</italic> being the organisms with the most new interactions inferred. These larger numbers for <italic>S. typhimurium</italic> LT2 and <italic>P. aeruginosa</italic> are probably a consequence of their phylogenetic closeness to <italic>E. coli</italic> K-12 (<xref ref-type="bibr" rid="ref11">Fukushima et al., 2002</xref>) in comparison to the other organisms used as models. It is important to note that some regulatory interactions were found in more than one organism; therefore, the sum of the rows may not correspond to the total number of new interactions, as is the case for the regulator PhoB (NP_414933.1) of <italic>E. coli</italic> K-12, which regulates the cytochrome bd-I ubiquinol oxidase subunit (NP_415262.1), as inferred from the interactions previously described in the <italic>B. subtilis</italic> and <italic>M. tuberculosis</italic> networks.</p>
</sec>
<sec id="sec13">
<title>Performance estimation of the approach</title>
<p>Regarding the reliability of interactions predicted by our approach, we compared networks with only TF-TG interactions derived from homology relationships for each of the six species with the respective reference GRNs. The comparisons were made by considering this to be a binary classification problem, and thus, edges (and graphlets) in both the reference network and the predicted GRN are TPs, edges only in the reference are FNs, and edges only in the predicted network are FPs. These results, shown in <xref rid="tab2" ref-type="table">Table 2</xref> for single edges and in <xref rid="tab3" ref-type="table">Table 3</xref> for graphlets, indicate a varying range of values depending on the compared bacteria. For recall (R), the rate of recovered TF-TG interactions ranged from 0.028 for <italic>M. tuberculosis</italic> to 0.52 for <italic>S. enterica</italic>, whereas precision (P), which indicates the likelihood that the existence of an edge is correctly predicted, ranged from 0.20 for <italic>P. aeruginosa</italic> to 0.69 for <italic>S. enterica</italic>. These results are significantly different from those expected by chance, as shown by the very low <italic>p</italic>-values obtained with the G-test. When the same metrics for the presence and absence of graphlets were used (<xref rid="tab3" ref-type="table">Table 3</xref>), we found a similar trend for each model GRN but with lower values for each metric. Lower values for the metrics calculated with graphlets are expected, since a single edge that differs between two networks often affects various graphlets.</p>
<table-wrap position="float" id="tab3">
<label>Table 3</label>
<caption>
<p>Graphlets absence comparison between the six reference networks employed in this work and their counterparts generated following our homology-based transfer approach from the other remaining networks.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top">Organism</th>
<th align="center" valign="top">TP</th>
<th align="center" valign="top">FP</th>
<th align="center" valign="top">TN</th>
<th align="center" valign="top">FN</th>
<th align="center" valign="top"><italic>R</italic></th>
<th align="center" valign="top"><italic>P</italic></th>
<th align="center" valign="top"><italic>F</italic>1</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top"><italic>B. subtilis 168</italic></td>
<td align="center" valign="top">2,241</td>
<td align="center" valign="top">10,008</td>
<td align="center" valign="top">622,878,341</td>
<td align="center" valign="top">145,210</td>
<td align="char" valign="top" char=".">0.0152</td>
<td align="char" valign="top" char=".">0.183</td>
<td align="char" valign="top" char=".">0.0281</td>
</tr>
<tr>
<td align="left" valign="top"><italic>E. coli K-12</italic></td>
<td align="center" valign="top">57,366</td>
<td align="center" valign="top">38,545</td>
<td align="center" valign="top">619,477,397</td>
<td align="center" valign="top">185,907</td>
<td align="char" valign="top" char=".">0.2358</td>
<td align="char" valign="top" char=".">0.5981</td>
<td align="char" valign="top" char=".">0.3383</td>
</tr>
<tr>
<td align="left" valign="top"><italic>P. aeruginosa PAO1</italic></td>
<td align="center" valign="top">101</td>
<td align="center" valign="top">2,815</td>
<td align="center" valign="top">73,261,825</td>
<td align="center" valign="top">12,989</td>
<td align="char" valign="top" char=".">0.0077</td>
<td align="char" valign="top" char=".">0.0346</td>
<td align="char" valign="top" char=".">0.0126</td>
</tr>
<tr>
<td align="left" valign="top"><italic>S. typhimurium LT2</italic></td>
<td align="center" valign="top">56,206</td>
<td align="center" valign="top">50,622</td>
<td align="center" valign="top">362,053,161</td>
<td align="center" valign="top">134,678</td>
<td align="char" valign="top" char=".">0.2945</td>
<td align="char" valign="top" char=".">0.5261</td>
<td align="char" valign="top" char=".">0.3776</td>
</tr>
<tr>
<td align="left" valign="top"><italic>S. aureus N315</italic></td>
<td align="center" valign="top">2,087</td>
<td align="center" valign="top">5,176</td>
<td align="center" valign="top">17,864,376</td>
<td align="center" valign="top">19,578</td>
<td align="char" valign="top" char=".">0.0963</td>
<td align="char" valign="top" char=".">0.2873</td>
<td align="char" valign="top" char=".">0.1443</td>
</tr>
<tr>
<td align="left" valign="top"><italic>M. tuberculosis H37Rv</italic></td>
<td align="center" valign="top">215</td>
<td align="center" valign="top">1,876</td>
<td align="center" valign="top">117,513,083</td>
<td align="center" valign="top">234,607</td>
<td align="char" valign="top" char=".">0.0009</td>
<td align="char" valign="top" char=".">0.1028</td>
<td align="char" valign="top" char=".">0.0018</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="sec14">
<title>The expanded GRNs identified new TF-TG interactions</title>
<p>Based on the expanded networks, we identified new TF-TG interactions described in <xref rid="tab4" ref-type="table">Table 4</xref> that must be exhaustively analyzed. In this regard, we found an increase in the number of targets, TFs, nodes, and interactions for all the bacterial and archaeal extended networks. For instance, for <italic>M. tuberculosis</italic> H37Rv, there was an increase of 776 new interactions (305 new TGs and 31 new TFs), whereas for <italic>B. subtilis</italic>, 1,821 new interactions (36 new TFs and 553 new TGs) were identified. Therefore, we performed a literature search to find evidence to support our predictions. Based on these searches, and considering the 1,676 new interactions for <italic>E. coli</italic> K-12 (56 new TFs and 570 new TGs), we identified that 179 of these interactions have been described in the literature (<xref ref-type="supplementary-material" rid="SM1">Supplementary material</xref>); however, they are not deposited in RegulonDB. In particular, we found that the interaction of SoxS and <italic>ompW</italic> in the GRN of <italic>E. coli</italic>, inferred from <italic>S. enterica</italic>, has been experimentally described. In <italic>E. coli</italic>, <italic>ompW</italic> is regulated by three TFs, as described in RegulonDB; however, we found that it could also be regulated by SoxS (<xref ref-type="bibr" rid="ref49">Zhang et al., 2020</xref>) in a negative fashion.</p>
<table-wrap position="float" id="tab4">
<label>Table 4</label>
<caption>
<p>Comparisons between experimentally determined and inferred GRNs.</p>
</caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="middle">Organism</th>
<th align="center" valign="middle">Target counts</th>
<th align="center" valign="middle">Target counts extended_tu</th>
<th align="center" valign="middle">TF counts</th>
<th align="center" valign="middle">TF counts extended_tu</th>
<th align="center" valign="middle">Node count</th>
<th align="center" valign="middle">Node count extended_tu</th>
<th align="center" valign="middle">Edge count</th>
<th align="center" valign="middle">Edge count extended_tu</th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top"><italic>B. subtilis 168</italic></td>
<td align="center" valign="top">1,748</td>
<td align="center" valign="top">2,301</td>
<td align="center" valign="top">191</td>
<td align="center" valign="top">227</td>
<td align="center" valign="top">1,799</td>
<td align="center" valign="top">2,339</td>
<td align="center" valign="top">2,738</td>
<td align="center" valign="top">4,559</td>
</tr>
<tr>
<td align="left" valign="top"><italic>E. coli K-12</italic></td>
<td align="center" valign="top">1,618</td>
<td align="center" valign="top">2,188</td>
<td align="center" valign="top">196</td>
<td align="center" valign="top">252</td>
<td align="center" valign="top">1,670</td>
<td align="center" valign="top">2,224</td>
<td align="center" valign="top">3,616</td>
<td align="center" valign="top">5,292</td>
</tr>
<tr>
<td align="left" valign="top"><italic>P. aeruginosa PAO1</italic></td>
<td align="center" valign="top">604</td>
<td align="center" valign="top">1,701</td>
<td align="center" valign="top">124</td>
<td align="center" valign="top">236</td>
<td align="center" valign="top">638</td>
<td align="center" valign="top">1,741</td>
<td align="center" valign="top">998</td>
<td align="center" valign="top">3,497</td>
</tr>
<tr>
<td align="left" valign="top"><italic>S. typhimurium LT2</italic></td>
<td align="center" valign="top">1,640</td>
<td align="center" valign="top">2,371</td>
<td align="center" valign="top">131</td>
<td align="center" valign="top">224</td>
<td align="center" valign="top">1,670</td>
<td align="center" valign="top">2,404</td>
<td align="center" valign="top">2,969</td>
<td align="center" valign="top">5,386</td>
</tr>
<tr>
<td align="left" valign="top"><italic>S. aureus N315</italic></td>
<td align="center" valign="top">584</td>
<td align="center" valign="top">973</td>
<td align="center" valign="top">51</td>
<td align="center" valign="top">101</td>
<td align="center" valign="top">598</td>
<td align="center" valign="top">990</td>
<td align="center" valign="top">709</td>
<td align="center" valign="top">1,518</td>
</tr>
<tr>
<td align="left" valign="top"><italic>M. tuberculosis H37Rv</italic></td>
<td align="center" valign="top">1,405</td>
<td align="center" valign="top">1,710</td>
<td align="center" valign="top">76</td>
<td align="center" valign="top">107</td>
<td align="center" valign="top">1,431</td>
<td align="center" valign="top">1,733</td>
<td align="center" valign="top">2,637</td>
<td align="center" valign="top">3,413</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p>Columns are as follows: Genome name; columns 1, 3, 5, and 7 indicate the Targets, TFs, nodes, and number of interactions identified in the original networks; columns 2, 4, 6, and 8 indicate the Targets, TFs, nodes, and number of interactions identified in the extended networks.</p>
</table-wrap-foot>
</table-wrap>
<p>We also found a new interaction in which CpxR could be regulating the <italic>tar</italic> gene. This TF, together with CsgD, has been described in bacterial adhesion and belongs to the stationary-phase response (<xref ref-type="bibr" rid="ref38">Santos-Zavaleta et al., 2019b</xref>). Experimental evidence suggests that CpxR and CsgD repress the transcription of <italic>fliA</italic>, <italic>flgM</italic>, and <italic>tar</italic> (<xref ref-type="bibr" rid="ref8">Dudin et al., 2014</xref>), in addition to <italic>bglG</italic> and <italic>bglB</italic> (<xref ref-type="bibr" rid="ref24">Matt&#x00E9;otti et al., 2011</xref>), and PdhR and <italic>lipA</italic> (<xref ref-type="bibr" rid="ref15">Kaleta et al., 2010</xref>). These regulatory interactions identified by our orthology-based inferences have not been documented in RegulonDB.</p>
</sec>
<sec id="sec15">
<title>Web server</title>
<p>The GRNs inferred for all the bacterial and archaeal genomes are available through a web server whose interface is shown in <xref rid="fig2" ref-type="fig">Figure 2</xref>. The GRNs of user-selected organisms are shown in an embedded interactive display that, through a very intuitive mouse-based interface, allows the user to select subnetworks and different types of regulatory interactions. Edge and node colors can also be redefined, as well as the layout used in the network visualization, depending on their properties. Additionally, the user can display and visualize information related to genes (name, protein ID, start and end coordinates, and strand) and to the edges among nodes representing genes, including information about whether this is a new or known edge and the organism from which it was derived. Moreover, if information is available, the user can click on the node name or protein identifier to access the NCBI/UniProt page related to the gene of interest.</p>
<fig position="float" id="fig2">
<label>Figure 2</label>
<caption>
<p>Online interface of the &#x201C;regulatory networks&#x201D; server storing the publicly available database. Diverse options are available for the user: a description of the system, a page to download the raw data, and the core section of the web to filter a GRN (purple box). To visualize a network, the user can select the Gene Regulatory Network of the organism of interest in the &#x201C;load a network&#x201D; panel. In the Select network box, the user can <italic>Start</italic> by selecting the name of the organism and then click on the <italic>Load</italic> button to visualize the network in the right window (red box). This action will load the graph (black box) and node/edge properties (cyan box). Diverse layouts can be applied to visualize the network, and specific nodes/edges can be selected to generate a new subgraph (green box). As the graph visualization could be modified, the user can center/fit the network (White buttons) or reset the current visualization (Yellow button). Finally, for displayed nodes and edges, the user can download this network (Green button). In the example, in the right panel, the network is associated with the transcription factor DnaA (diamond) and its target genes (circles). Edges represent the transcription direction (when it is available). In the lower panel, the TGs under the regulation of the TF are shown: NCBI ID, gene name, protein ID, start and end position, and strand. For more details of the web application, please refer to the <xref ref-type="supplementary-material" rid="SM1">Supplementary material</xref>.</p>
</caption>
<graphic xlink:href="fmicb-13-923105-g002.tif"/>
</fig>
<p>Entire GRNs or user-defined subnetworks can be downloaded in a standard format for further inspection with tools such as Cytoscape, which, in addition, connects our tool to the whole array of apps already available for this visualization tool. For more information and a more detailed description of both the input and output files, see the help section of the website <ext-link xlink:href="https://regulatorynetworks.unam.mx/" ext-link-type="uri">https://regulatorynetworks.unam.mx/</ext-link> or <ext-link xlink:href="http://132.247.46.6/" ext-link-type="uri">http://132.247.46.6/</ext-link>, where an example is provided.</p>
</sec>
</sec>
<sec id="sec16" sec-type="conclusions">
<title>Conclusion</title>
<p>In this work, we have expanded the GRNs for six model organisms, by considering orthologous inference and TU assignments. This inference is based on the assumption that orthologous TFs generally regulate the expression of orthologous TGs (<xref ref-type="bibr" rid="ref48">Yu et al., 2004</xref>; <xref ref-type="bibr" rid="ref12">Gal&#x00E1;n-V&#x00E1;squez et al., 2011</xref>; <xref ref-type="bibr" rid="ref20">Lenz et al., 2020</xref>; <xref ref-type="bibr" rid="ref43">Soberanes-Guti&#x00E9;rrez et al., 2021</xref>). The inferred interactions were included in the GRN, and their topological properties were calculated. In a second step, we inferred the GRNs for 12,879 genomes, based on TF-TG orthology relationships of six bacterial species with well-known regulatory interactions and TU assignments. We discuss some examples to show the most relevant results obtained from this inference, and topological metrics are calculated for these networks. Therefore, our approach to reconstruct regulatory networks is a valuable resource of regulatory interactions occurring within bacteria and archaea cellular domains, and it may integrate with global expression data available for these organisms in order to improve global interaction data models. From an evolutionary perspective, the dynamics to expand or modify the repertoire of cellular functions that transcription factors control involves: (a) transcriptional rewiring whereby the promoters of orthologous genes in related species differ in the presence or absence of a binding site(s) for a conserved transcription factor(s); (b) embedding horizontally acquired genes under regulation of an ancestral transcription factor; (c) restructuring of the promoters controlled by a transcription factor; and (d) modifications in the transcription factors themselves (<xref ref-type="bibr" rid="ref32">Perez and Groisman, 2009</xref>; <xref ref-type="bibr" rid="ref34">P&#x00E9;rez-Rueda et al., 2009</xref>). 
In this context, the inference of archaeal GRNs was based on the hypothesis that bacteria and archaea share a common ancestry in terms of their TFs, with subsequent divergence (<xref ref-type="bibr" rid="ref3">Bell and Jackson, 2001</xref>; <xref ref-type="bibr" rid="ref27">Minezaki et al., 2005</xref>), whereas the origin of the ancestral basal transcriptional machinery cannot be ascertained, and it could have been bacterial or archaeal&#x2013;eukaryal type. For instance, 53% of the total repertoire of archaeal TFs exhibit at least one homologue in bacterial genomes. In particular, archaea and clostridia share a common set of TFs classified in diverse evolutionary families (<xref ref-type="bibr" rid="ref18">Kyrpides and Woese, 1998</xref>; <xref ref-type="bibr" rid="ref2">Bell, 2005</xref>; <xref ref-type="bibr" rid="ref33">P&#x00E9;rez-Rueda and Janga, 2010</xref>), different from the families shared with several Actinobacteria and some Gammaproteobacteria. This reinforces the notion that TFs of bacteria and archaea share a common ancestry and highlights a close relationship between the TFs from archaea and Firmicutes. In addition, bacteria and archaea share an operonic organization (<xref ref-type="bibr" rid="ref40">Seitzer et al., 2020</xref>; <xref ref-type="bibr" rid="ref45">Sueda et al., 2021</xref>). However, the experimental information concerning GRNs in archaea is limited. For instance, the GRN of <italic>Pyrococcus furiosus</italic> shows seven regulons and 279 genes, which represent 13.5% of the total genes in this archaeon (<xref ref-type="bibr" rid="ref7">Denis et al., 2018</xref>). Therefore, inferences of GRNs are central to explore in detail the organisms included in this cellular domain.</p>
<p>Finally, we have provided readers with a website where all the networks can be analyzed and downloaded.</p>
</sec>
<sec id="sec17" sec-type="data-availability">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/<xref ref-type="supplementary-material" rid="SM1">Supplementary material</xref>, further inquiries can be directed to the corresponding authors.</p>
</sec>
<sec id="sec18">
<title>Author contributions</title>
<p>All authors listed have made a substantial, direct, and intellectual contribution to the work and approved it for publication.</p>
</sec>
<sec id="sec19" sec-type="funding-information">
<title>Funding</title>
<p>This work was supported by Direcci&#x00F3;n General de Asuntos del Personal Acad&#x00E9;mico-Universidad Nacional Aut&#x00F3;noma de M&#x00E9;xico (IN-209620) and CONACYT (320012) and Agencia Nacional de Investigaci&#x00F3;n Cient&#x00ED;fica y Desarrollo (ANID) FONDECYT 1181089 awarded to AM. Powered@NLHPC: this research was partially supported by the supercomputing infrastructure of the NLHPC (ECM-02) and the computing infrastructure of the Centro de Gen&#x00F3;mica y Bioinform&#x00E1;tica, Universidad Mayor.</p>
</sec>
<sec id="conf1" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="sec100" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
</body>
<back>
<ack>
<p>We thank Israel Sanchez, Ana Cecilia Perez Arteaga, and Ramiro Chavez Tovar for their technical support.</p>
</ack>
<sec id="sec21" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary material for this article can be found online at: <ext-link xlink:href="https://www.frontiersin.org/articles/10.3389/fmicb.2022.923105/full#supplementary-material" ext-link-type="uri">https://www.frontiersin.org/articles/10.3389/fmicb.2022.923105/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Data_Sheet_1.ZIP" id="SM1" mimetype="application/zip" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Data_Sheet_2.PDF" id="SM2" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="ref1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Balderas-Mart&#x00ED;nez</surname> <given-names>Y. I.</given-names></name> <name><surname>Savageau</surname> <given-names>M.</given-names></name> <name><surname>Salgado</surname> <given-names>H.</given-names></name> <name><surname>P&#x00E9;rez-Rueda</surname> <given-names>E.</given-names></name> <name><surname>Morett</surname> <given-names>E.</given-names></name> <name><surname>Collado-Vides</surname> <given-names>J.</given-names></name></person-group> (<year>2013</year>). <article-title>Transcription factors in <italic>Escherichia coli</italic> prefer the holo conformation</article-title>. <source>PLoS One</source> <volume>8</volume>:<fpage>e65723</fpage>. doi: <pub-id pub-id-type="doi">10.1371/journal.pone.0065723</pub-id>, PMID: <pub-id pub-id-type="pmid">23776535</pub-id></citation></ref>
<ref id="ref2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bell</surname> <given-names>S. D.</given-names></name></person-group> (<year>2005</year>). <article-title>Archaeal transcriptional regulation--variation on a bacterial theme?</article-title> <source>Trends Microbiol.</source> <volume>13</volume>, <fpage>262</fpage>&#x2013;<lpage>265</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.tim.2005.03.015</pub-id></citation></ref>
<ref id="ref3"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bell</surname> <given-names>S. D.</given-names></name> <name><surname>Jackson</surname> <given-names>S. P.</given-names></name></person-group> (<year>2001</year>). <article-title>Mechanism and regulation of transcription in archaea</article-title>. <source>Curr. Opin. Microbiol.</source> <volume>4</volume>, <fpage>208</fpage>&#x2013;<lpage>213</lpage>. doi: <pub-id pub-id-type="doi">10.1016/s1369-5274(00)00190-9</pub-id></citation></ref>
<ref id="ref4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Browning</surname> <given-names>D. F.</given-names></name> <name><surname>Busby</surname> <given-names>S. J.</given-names></name></person-group> (<year>2016</year>). <article-title>Local and global regulation of transcription initiation in bacteria</article-title>. <source>Nat. Rev. Microbiol.</source> <volume>14</volume>, <fpage>638</fpage>&#x2013;<lpage>650</lpage>. doi: <pub-id pub-id-type="doi">10.1038/nrmicro.2016.103</pub-id>, PMID: <pub-id pub-id-type="pmid">27498839</pub-id></citation></ref>
<ref id="ref5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Castro-Melchor</surname> <given-names>M.</given-names></name> <name><surname>Charaniya</surname> <given-names>S.</given-names></name> <name><surname>Karypis</surname> <given-names>G.</given-names></name> <name><surname>Takano</surname> <given-names>E.</given-names></name> <name><surname>Hu</surname> <given-names>W. S.</given-names></name></person-group> (<year>2010</year>). <article-title>Genome-wide inference of regulatory networks in <italic>Streptomyces coelicolor</italic></article-title>. <source>BMC Genomics</source> <volume>11</volume>:<fpage>578</fpage>. doi: <pub-id pub-id-type="doi">10.1186/1471-2164-11-578</pub-id>, PMID: <pub-id pub-id-type="pmid">20955611</pub-id></citation></ref>
<ref id="ref6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>X.</given-names></name></person-group> (<year>2017</year>). <article-title>Prediction of optimal gene functions for osteosarcoma using network-based- guilt by association method based on gene oncology and microarray profile</article-title>. <source>J. Bone Oncol.</source> <volume>7</volume>, <fpage>18</fpage>&#x2013;<lpage>22</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jbo.2017.04.003</pub-id>, PMID: <pub-id pub-id-type="pmid">28443230</pub-id></citation></ref>
<ref id="ref7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Denis</surname> <given-names>A.</given-names></name> <name><surname>Mart&#x00ED;nez-N&#x00FA;&#x00F1;ez</surname> <given-names>M. A.</given-names></name> <name><surname>Tenorio-Salgado</surname> <given-names>S.</given-names></name> <name><surname>Perez-Rueda</surname> <given-names>E.</given-names></name></person-group> (<year>2018</year>). <article-title>Dissecting the Repertoire of DNA-Binding Transcription Factors of the Archaeon <italic>Pyrococcus furiosus</italic> DSM 3638</article-title>. <source>Life</source> <volume>8</volume>:<fpage>40</fpage>. doi: <pub-id pub-id-type="doi">10.3390/life8040040</pub-id>, PMID: <pub-id pub-id-type="pmid">30248960</pub-id></citation></ref>
<ref id="ref8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dudin</surname> <given-names>O.</given-names></name> <name><surname>Geiselmann</surname> <given-names>J.</given-names></name> <name><surname>Ogasawara</surname> <given-names>H.</given-names></name> <name><surname>Ishihama</surname> <given-names>A.</given-names></name> <name><surname>Lacour</surname> <given-names>S.</given-names></name></person-group> (<year>2014</year>). <article-title>Repression of flagellar genes in exponential phase by CsgD and CpxR, two crucial modulators of <italic>Escherichia coli</italic> biofilm formation</article-title>. <source>J. Bacteriol.</source> <volume>196</volume>, <fpage>707</fpage>&#x2013;<lpage>715</lpage>. doi: <pub-id pub-id-type="doi">10.1128/JB.00938-13</pub-id>, PMID: <pub-id pub-id-type="pmid">24272779</pub-id></citation></ref>
<ref id="ref9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Flores-Bautista</surname> <given-names>E.</given-names></name> <name><surname>Hernandez-Guerrero</surname> <given-names>R.</given-names></name> <name><surname>Huerta-Saquero</surname> <given-names>A.</given-names></name> <name><surname>Tenorio-Salgado</surname> <given-names>S.</given-names></name> <name><surname>Rivera-Gomez</surname> <given-names>N.</given-names></name> <name><surname>Romero</surname> <given-names>A.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>Deciphering the functional diversity of DNA-binding transcription factors in Bacteria and Archaea organisms</article-title>. <source>PLoS One</source> <volume>15</volume>:<fpage>e0237135</fpage>. doi: <pub-id pub-id-type="doi">10.1371/journal.pone.0237135</pub-id>, PMID: <pub-id pub-id-type="pmid">32822422</pub-id></citation></ref>
<ref id="ref10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Franz</surname> <given-names>M.</given-names></name> <name><surname>Lopes</surname> <given-names>C. T.</given-names></name> <name><surname>Huck</surname> <given-names>G.</given-names></name> <name><surname>Dong</surname> <given-names>Y.</given-names></name> <name><surname>Sumer</surname> <given-names>O.</given-names></name> <name><surname>Bader</surname> <given-names>G. D.</given-names></name></person-group> (<year>2016</year>). <article-title>Cytoscape.js: a graph theory library for visualisation and analysis</article-title>. <source>Bioinformatics</source> <volume>32</volume>, <fpage>309</fpage>&#x2013;<lpage>311</lpage>. doi: <pub-id pub-id-type="doi">10.1093/bioinformatics/btv557</pub-id>, PMID: <pub-id pub-id-type="pmid">26415722</pub-id></citation></ref>
<ref id="ref11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Fukushima</surname> <given-names>M.</given-names></name> <name><surname>Kakinuma</surname> <given-names>K.</given-names></name> <name><surname>Kawaguchi</surname> <given-names>R.</given-names></name></person-group> (<year>2002</year>). <article-title>Phylogenetic analysis of <italic>Salmonella</italic>, <italic>Shigella</italic>, and <italic>Escherichia coli</italic> strains on the basis of the <italic>gyrB</italic> gene sequence</article-title>. <source>J. Clin. Microbiol.</source> <volume>40</volume>, <fpage>2779</fpage>&#x2013;<lpage>2785</lpage>. doi: <pub-id pub-id-type="doi">10.1128/JCM.40.8.2779-2785.2002</pub-id>, PMID: <pub-id pub-id-type="pmid">12149329</pub-id></citation></ref>
<ref id="ref12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gal&#x00E1;n-V&#x00E1;squez</surname> <given-names>E.</given-names></name> <name><surname>Luna</surname> <given-names>B.</given-names></name> <name><surname>Mart&#x00ED;nez-Antonio</surname> <given-names>A.</given-names></name></person-group> (<year>2011</year>). <article-title>The Regulatory Network of <italic>Pseudomonas aeruginosa</italic></article-title>. <source>Microb. Inform. Exp.</source> <volume>1</volume>:<fpage>3</fpage>. doi: <pub-id pub-id-type="doi">10.1186/2042-5783-1-3</pub-id></citation></ref>
<ref id="ref14"><citation citation-type="other"><person-group person-group-type="author"><name><surname>Hagberg</surname> <given-names>A. A.</given-names></name> <name><surname>Schult</surname> <given-names>D. A.</given-names></name> <name><surname>Swart</surname> <given-names>P. J.</given-names></name></person-group> (<year>2008</year>). &#x201C;Exploring network structure, dynamics, and function using NetworkX,&#x201D; in <italic>Proceedings of the 7th Python in Science Conference (SciPy2008)</italic>. eds. G. Varoquaux, T. Vaught and J. Millman (Pasadena, CA, USA), 11&#x2013;15.</citation></ref>
<ref id="ref15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kaleta</surname> <given-names>C.</given-names></name> <name><surname>G&#x00F6;hler</surname> <given-names>A.</given-names></name> <name><surname>Schuster</surname> <given-names>S.</given-names></name> <name><surname>Jahreis</surname> <given-names>K.</given-names></name> <name><surname>Guthke</surname> <given-names>R.</given-names></name> <name><surname>Nikolajewa</surname> <given-names>S.</given-names></name></person-group> (<year>2010</year>). <article-title>Integrative inference of gene-regulatory networks in <italic>Escherichia coli</italic> using information theoretic concepts and sequence analysis</article-title>. <source>BMC Syst. Biol.</source> <volume>4</volume>:<fpage>116</fpage>. doi: <pub-id pub-id-type="doi">10.1186/1752-0509-4-116</pub-id>, PMID: <pub-id pub-id-type="pmid">20718955</pub-id></citation></ref>
<ref id="ref16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kapopoulou</surname> <given-names>A.</given-names></name> <name><surname>Lew</surname> <given-names>J. M.</given-names></name> <name><surname>Cole</surname> <given-names>S. T.</given-names></name></person-group> (<year>2011</year>). <article-title>The MycoBrowser portal: a comprehensive and manually annotated resource for mycobacterial genomes</article-title>. <source>Tuberculosis</source> <volume>91</volume>, <fpage>8</fpage>&#x2013;<lpage>13</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.tube.2010.09.006</pub-id>, PMID: <pub-id pub-id-type="pmid">20980200</pub-id></citation></ref>
<ref id="ref17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Karlebach</surname> <given-names>G.</given-names></name> <name><surname>Shamir</surname> <given-names>R.</given-names></name></person-group> (<year>2008</year>). <article-title>Modelling and analysis of gene regulatory networks</article-title>. <source>Nat. Rev. Mol. Cell Biol.</source> <volume>9</volume>, <fpage>770</fpage>&#x2013;<lpage>780</lpage>. doi: <pub-id pub-id-type="doi">10.1038/nrm2503</pub-id></citation></ref>
<ref id="ref18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kyrpides</surname> <given-names>N. C.</given-names></name> <name><surname>Woese</surname> <given-names>C. R.</given-names></name></person-group> (<year>1998</year>). <article-title>Archaeal translation initiation revisited: the initiation factor 2 and eukaryotic initiation factor 2B alpha-beta-delta subunit families</article-title>. <source>Proc. Natl. Acad. Sci. U. S. A.</source> <volume>95</volume>, <fpage>3726</fpage>&#x2013;<lpage>3730</lpage>. doi: <pub-id pub-id-type="doi">10.1073/pnas.95.7.3726</pub-id>, PMID: <pub-id pub-id-type="pmid">9520434</pub-id></citation></ref>
<ref id="ref19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lechner</surname> <given-names>M.</given-names></name> <name><surname>Findeiss</surname> <given-names>S.</given-names></name> <name><surname>Steiner</surname> <given-names>L.</given-names></name> <name><surname>Marz</surname> <given-names>M.</given-names></name> <name><surname>Stadler</surname> <given-names>P. F.</given-names></name> <name><surname>Prohaska</surname> <given-names>S. J.</given-names></name></person-group> (<year>2011</year>). <article-title>Proteinortho: detection of (co-)orthologs in large-scale analysis</article-title>. <source>BMC Bioinformatics</source> <volume>12</volume>:<fpage>124</fpage>. doi: <pub-id pub-id-type="doi">10.1186/1471-2105-12-124</pub-id>, PMID: <pub-id pub-id-type="pmid">21526987</pub-id></citation></ref>
<ref id="ref20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lenz</surname> <given-names>A. R.</given-names></name> <name><surname>Gal&#x00E1;n-V&#x00E1;squez</surname> <given-names>E.</given-names></name> <name><surname>Balbinot</surname> <given-names>E.</given-names></name> <name><surname>de Abreu</surname> <given-names>F. P.</given-names></name> <name><surname>Souza de Oliveira</surname> <given-names>N.</given-names></name> <name><surname>da Rosa</surname> <given-names>L. O.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>Gene Regulatory Networks of <italic>Penicillium echinulatum</italic> 2HH and <italic>Penicillium oxalicum</italic> 114-2 Inferred by a Computational Biology Approach</article-title>. <source>Front. Microbiol.</source> <volume>11</volume>:<fpage>588263</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fmicb.2020.588263</pub-id>, PMID: <pub-id pub-id-type="pmid">33193246</pub-id></citation></ref>
<ref id="ref21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>H.</given-names></name> <name><surname>Ma</surname> <given-names>X.</given-names></name> <name><surname>Tang</surname> <given-names>Y.</given-names></name> <name><surname>Wang</surname> <given-names>D.</given-names></name> <name><surname>Zhang</surname> <given-names>Z.</given-names></name> <name><surname>Liu</surname> <given-names>Z.</given-names></name></person-group> (<year>2021</year>). <article-title>Network-based analysis of virulence factors for uncovering <italic>Aeromonas veronii</italic> pathogenesis</article-title>. <source>BMC Microbiol.</source> <volume>21</volume>:<fpage>188</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12866-021-02261-8</pub-id>, PMID: <pub-id pub-id-type="pmid">34162325</pub-id></citation></ref>
<ref id="ref22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Martin</surname> <given-names>A. J.</given-names></name> <name><surname>Contreras-Riquelme</surname> <given-names>S.</given-names></name> <name><surname>Dominguez</surname> <given-names>C.</given-names></name> <name><surname>Perez-Acle</surname> <given-names>T.</given-names></name></person-group> (<year>2017</year>). <article-title>LoTo: a graphlet based method for the comparison of local topology between gene regulatory networks</article-title>. <source>PeerJ</source> <volume>5</volume>:<fpage>e3052</fpage>. doi: <pub-id pub-id-type="doi">10.7717/peerj.3052</pub-id>, PMID: <pub-id pub-id-type="pmid">28265516</pub-id></citation></ref>
<ref id="ref23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mart&#x00ED;nez-N&#x00FA;&#x00F1;ez</surname> <given-names>M. A.</given-names></name> <name><surname>Poot-Hernandez</surname> <given-names>A. C.</given-names></name> <name><surname>Rodr&#x00ED;guez-V&#x00E1;zquez</surname> <given-names>K.</given-names></name> <name><surname>Perez-Rueda</surname> <given-names>E.</given-names></name></person-group> (<year>2013</year>). <article-title>Increments and duplication events of enzymes and transcription factors influence metabolic and regulatory diversity in prokaryotes</article-title>. <source>PLoS One</source> <volume>8</volume>:<fpage>e69707</fpage>. doi: <pub-id pub-id-type="doi">10.1371/journal.pone.0069707</pub-id>, PMID: <pub-id pub-id-type="pmid">23922780</pub-id></citation></ref>
<ref id="ref24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Matt&#x00E9;otti</surname> <given-names>C.</given-names></name> <name><surname>Haubruge</surname> <given-names>E.</given-names></name> <name><surname>Thonart</surname> <given-names>P.</given-names></name> <name><surname>Francis</surname> <given-names>F.</given-names></name> <name><surname>de Pauw</surname> <given-names>E.</given-names></name> <name><surname>Portetelle</surname> <given-names>D.</given-names></name> <etal/></person-group>. (<year>2011</year>). <article-title>Characterization of a new &#x03B2;-glucosidase/&#x03B2;-xylosidase from the gut microbiota of the termite (<italic>Reticulitermes santonensis</italic>)</article-title>. <source>FEMS Microbiol. Lett.</source> <volume>314</volume>, <fpage>147</fpage>&#x2013;<lpage>157</lpage>. doi: <pub-id pub-id-type="doi">10.1111/j.1574-6968.2010.02161.x</pub-id>, PMID: <pub-id pub-id-type="pmid">21114521</pub-id></citation></ref>
<ref id="ref25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>M&#x00E9;tris</surname> <given-names>A.</given-names></name> <name><surname>Sudhakar</surname> <given-names>P.</given-names></name> <name><surname>Fazekas</surname> <given-names>D.</given-names></name> <name><surname>Demeter</surname> <given-names>A.</given-names></name> <name><surname>Ari</surname> <given-names>E.</given-names></name> <name><surname>Olbei</surname> <given-names>M.</given-names></name> <etal/></person-group>. (<year>2017</year>). <article-title>SalmoNet, an integrated network of ten <italic>Salmonella enterica</italic> strains reveals common and distinct pathways to host adaptation</article-title>. <source>NPJ Syst. Biol. Appl.</source> <volume>3</volume>:<fpage>31</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41540-017-0034-z</pub-id>, PMID: <pub-id pub-id-type="pmid">29057095</pub-id></citation></ref>
<ref id="ref26"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Milo</surname> <given-names>R.</given-names></name> <name><surname>Shen-Orr</surname> <given-names>S.</given-names></name> <name><surname>Itzkovitz</surname> <given-names>S.</given-names></name> <name><surname>Kashtan</surname> <given-names>N.</given-names></name> <name><surname>Chklovskii</surname> <given-names>D.</given-names></name> <name><surname>Alon</surname> <given-names>U.</given-names></name></person-group> (<year>2002</year>). <article-title>Network motifs: simple building blocks of complex networks</article-title>. <source>Science</source> <volume>298</volume>, <fpage>824</fpage>&#x2013;<lpage>827</lpage>. doi: <pub-id pub-id-type="doi">10.1126/science.298.5594.824</pub-id>, PMID: <pub-id pub-id-type="pmid">12399590</pub-id></citation></ref>
<ref id="ref27"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Minezaki</surname> <given-names>Y.</given-names></name> <name><surname>Homma</surname> <given-names>K.</given-names></name> <name><surname>Nishikawa</surname> <given-names>K.</given-names></name></person-group> (<year>2005</year>). <article-title>Genome-wide survey of transcription factors in prokaryotes reveals many bacteria-specific families not found in archaea</article-title>. <source>DNA Res.</source> <volume>12</volume>, <fpage>269</fpage>&#x2013;<lpage>280</lpage>. doi: <pub-id pub-id-type="doi">10.1093/dnares/dsi016</pub-id>, PMID: <pub-id pub-id-type="pmid">16769689</pub-id></citation></ref>
<ref id="ref28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Moreno-Hagelsieb</surname> <given-names>G.</given-names></name> <name><surname>Collado-Vides</surname> <given-names>J.</given-names></name></person-group> (<year>2002</year>). <article-title>A powerful non-homology method for the prediction of operons in prokaryotes</article-title>. <source>Bioinformatics</source> <volume>18</volume>, <fpage>S329</fpage>&#x2013;<lpage>S336</lpage>. doi: <pub-id pub-id-type="doi">10.1093/bioinformatics/18.suppl_1.s329</pub-id>, PMID: <pub-id pub-id-type="pmid">12169563</pub-id></citation></ref>
<ref id="ref29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Novichkov</surname> <given-names>P. S.</given-names></name> <name><surname>Rodionov</surname> <given-names>D. A.</given-names></name> <name><surname>Stavrovskaya</surname> <given-names>E. D.</given-names></name> <name><surname>Novichkova</surname> <given-names>E. S.</given-names></name> <name><surname>Kazakov</surname> <given-names>A. E.</given-names></name> <name><surname>Gelfand</surname> <given-names>M. S.</given-names></name> <etal/></person-group>. (<year>2010</year>). <article-title>RegPredict: an integrated system for regulon inference in prokaryotes by comparative genomics approach</article-title>. <source>Nucleic Acids Res.</source> <volume>38</volume>, <fpage>W299</fpage>&#x2013;<lpage>W307</lpage>. doi: <pub-id pub-id-type="doi">10.1093/nar/gkq531</pub-id>, PMID: <pub-id pub-id-type="pmid">20542910</pub-id></citation></ref>
<ref id="ref30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Oliver</surname> <given-names>S.</given-names></name></person-group> (<year>2000</year>). <article-title>Guilt-by-association goes global</article-title>. <source>Nature</source> <volume>403</volume>, <fpage>601</fpage>&#x2013;<lpage>602</lpage>. doi: <pub-id pub-id-type="doi">10.1038/35001165</pub-id>, PMID: <pub-id pub-id-type="pmid">10688178</pub-id></citation></ref>
<ref id="ref31"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Otasek</surname> <given-names>D.</given-names></name> <name><surname>Morris</surname> <given-names>J. H.</given-names></name> <name><surname>Bou&#x00E7;as</surname> <given-names>J.</given-names></name> <name><surname>Pico</surname> <given-names>A. R.</given-names></name> <name><surname>Demchak</surname> <given-names>B.</given-names></name></person-group> (<year>2019</year>). <article-title>Cytoscape Automation: empowering workflow-based network analysis</article-title>. <source>Genome Biol.</source> <volume>20</volume>:<fpage>185</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s13059-019-1758-4</pub-id>, PMID: <pub-id pub-id-type="pmid">31477170</pub-id></citation></ref>
<ref id="ref32"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Perez</surname> <given-names>J. C.</given-names></name> <name><surname>Groisman</surname> <given-names>E. A.</given-names></name></person-group> (<year>2009</year>). <article-title>Evolution of transcriptional regulatory circuits in bacteria</article-title>. <source>Cell</source> <volume>138</volume>, <fpage>233</fpage>&#x2013;<lpage>244</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.cell.2009.07.002</pub-id>, PMID: <pub-id pub-id-type="pmid">19632175</pub-id></citation></ref>
<ref id="ref33"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>P&#x00E9;rez-Rueda</surname> <given-names>E.</given-names></name> <name><surname>Janga</surname> <given-names>S. C.</given-names></name></person-group> (<year>2010</year>). <article-title>Identification and genomic analysis of transcription factors in archaeal genomes exemplifies their functional architecture and evolutionary origin</article-title>. <source>Mol. Biol. Evol.</source> <volume>27</volume>, <fpage>1449</fpage>&#x2013;<lpage>1459</lpage>. doi: <pub-id pub-id-type="doi">10.1093/molbev/msq033</pub-id>, PMID: <pub-id pub-id-type="pmid">20123795</pub-id></citation></ref>
<ref id="ref34"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>P&#x00E9;rez-Rueda</surname> <given-names>E.</given-names></name> <name><surname>Janga</surname> <given-names>S. C.</given-names></name> <name><surname>Mart&#x00ED;nez-Antonio</surname> <given-names>A.</given-names></name></person-group> (<year>2009</year>). <article-title>Scaling relationship in the gene content of transcriptional machinery in bacteria</article-title>. <source>Mol. BioSyst.</source> <volume>5</volume>, <fpage>1494</fpage>&#x2013;<lpage>1501</lpage>. doi: <pub-id pub-id-type="doi">10.1039/b907384a</pub-id>, PMID: <pub-id pub-id-type="pmid">19763344</pub-id></citation></ref>
<ref id="ref35"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Poudel</surname> <given-names>S.</given-names></name> <name><surname>Tsunemoto</surname> <given-names>H.</given-names></name> <name><surname>Seif</surname> <given-names>Y.</given-names></name> <name><surname>Sastry</surname> <given-names>A. V.</given-names></name> <name><surname>Szubin</surname> <given-names>R.</given-names></name> <name><surname>Xu</surname> <given-names>S.</given-names></name> <etal/></person-group>. (<year>2020</year>). <article-title>Revealing 29 sets of independently modulated genes in <italic>Staphylococcus aureus</italic>, their regulators, and role in key physiological response</article-title>. <source>Proc. Natl. Acad. Sci. U. S. A.</source> <volume>117</volume>, <fpage>17228</fpage>&#x2013;<lpage>17239</lpage>. doi: <pub-id pub-id-type="doi">10.1073/pnas.2008413117</pub-id>, PMID: <pub-id pub-id-type="pmid">32616573</pub-id></citation></ref>
<ref id="ref36"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ravcheev</surname> <given-names>D. A.</given-names></name> <name><surname>Best</surname> <given-names>A. A.</given-names></name> <name><surname>Tintle</surname> <given-names>N.</given-names></name> <name><surname>Dejongh</surname> <given-names>M.</given-names></name> <name><surname>Osterman</surname> <given-names>A. L.</given-names></name> <name><surname>Novichkov</surname> <given-names>P. S.</given-names></name> <etal/></person-group>. (<year>2011</year>). <article-title>Inference of the transcriptional regulatory network in <italic>Staphylococcus aureus</italic> by integration of experimental and genomics-based evidence</article-title>. <source>J. Bacteriol.</source> <volume>193</volume>, <fpage>3228</fpage>&#x2013;<lpage>3240</lpage>. doi: <pub-id pub-id-type="doi">10.1128/JB.00350-11</pub-id>, PMID: <pub-id pub-id-type="pmid">21531804</pub-id></citation></ref>
<ref id="ref37"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Santos-Zavaleta</surname> <given-names>A.</given-names></name> <name><surname>Perez-Rueda</surname> <given-names>E.</given-names></name> <name><surname>S&#x00E1;nchez-P&#x00E9;rez</surname> <given-names>M.</given-names></name> <name><surname>Vel&#x00E1;zquez-Ram&#x00ED;rez</surname> <given-names>D. A.</given-names></name> <name><surname>Collado-Vides</surname> <given-names>J.</given-names></name></person-group> (<year>2019a</year>). <article-title>Tracing the phylogenetic history of the Crl regulon through the Bacteria and Archaea genomes</article-title>. <source>BMC Genomics</source> <volume>20</volume>:<fpage>299</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12864-019-5619-z</pub-id></citation></ref>
<ref id="ref38"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Santos-Zavaleta</surname> <given-names>A.</given-names></name> <name><surname>Salgado</surname> <given-names>H.</given-names></name> <name><surname>Gama-Castro</surname> <given-names>S.</given-names></name> <name><surname>S&#x00E1;nchez-P&#x00E9;rez</surname> <given-names>M.</given-names></name> <name><surname>G&#x00F3;mez-Romero</surname> <given-names>L.</given-names></name> <name><surname>Ledezma-Tejeida</surname> <given-names>D.</given-names></name> <etal/></person-group>. (<year>2019b</year>). <article-title>RegulonDB v 10.5: tackling challenges to unify classic and high throughput knowledge of gene regulation in <italic>E. coli</italic> K-12</article-title>. <source>Nucleic Acids Res.</source> <volume>47</volume>, <fpage>D212</fpage>&#x2013;<lpage>D220</lpage>. doi: <pub-id pub-id-type="doi">10.1093/nar/gky1077</pub-id></citation></ref>
<ref id="ref39"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sanz</surname> <given-names>J.</given-names></name> <name><surname>Navarro</surname> <given-names>J.</given-names></name> <name><surname>Arbu&#x00E9;s</surname> <given-names>A.</given-names></name> <name><surname>Mart&#x00ED;n</surname> <given-names>C.</given-names></name> <name><surname>Mariju&#x00E1;n</surname> <given-names>P. C.</given-names></name> <name><surname>Moreno</surname> <given-names>Y.</given-names></name></person-group> (<year>2011</year>). <article-title>The transcriptional regulatory network of <italic>Mycobacterium tuberculosis</italic></article-title>. <source>PLoS One</source> <volume>6</volume>:<fpage>e22178</fpage>. doi: <pub-id pub-id-type="doi">10.1371/journal.pone.0022178</pub-id>, PMID: <pub-id pub-id-type="pmid">21818301</pub-id></citation></ref>
<ref id="ref40"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Seitzer</surname> <given-names>P.</given-names></name> <name><surname>Yao</surname> <given-names>A. I.</given-names></name> <name><surname>Cisneros</surname> <given-names>A.</given-names></name> <name><surname>Facciotti</surname> <given-names>M. T.</given-names></name></person-group> (<year>2020</year>). <article-title>The Exploration of Novel Regulatory Relationships Drives Haloarchaeal Operon-Like Structural Dynamics over Short Evolutionary Distances</article-title>. <source>Microorganisms</source> <volume>8</volume>:<fpage>1900</fpage>. doi: <pub-id pub-id-type="doi">10.3390/microorganisms8121900</pub-id>, PMID: <pub-id pub-id-type="pmid">33266086</pub-id></citation></ref>
<ref id="ref41"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shannon</surname> <given-names>P.</given-names></name> <name><surname>Markiel</surname> <given-names>A.</given-names></name> <name><surname>Ozier</surname> <given-names>O.</given-names></name> <name><surname>Baliga</surname> <given-names>N. S.</given-names></name> <name><surname>Wang</surname> <given-names>J. T.</given-names></name> <name><surname>Ramage</surname> <given-names>D.</given-names></name> <etal/></person-group>. (<year>2003</year>). <article-title>Cytoscape: a software environment for integrated models of biomolecular interaction networks</article-title>. <source>Genome Res.</source> <volume>13</volume>, <fpage>2498</fpage>&#x2013;<lpage>2504</lpage>. doi: <pub-id pub-id-type="doi">10.1101/gr.1239303</pub-id>, PMID: <pub-id pub-id-type="pmid">14597658</pub-id></citation></ref>
<ref id="ref42"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sierro</surname> <given-names>N.</given-names></name> <name><surname>Makita</surname> <given-names>Y.</given-names></name> <name><surname>de Hoon</surname> <given-names>M.</given-names></name> <name><surname>Nakai</surname> <given-names>K.</given-names></name></person-group> (<year>2008</year>). <article-title>DBTBS: a database of transcriptional regulation in <italic>Bacillus subtilis</italic> containing upstream intergenic conservation information</article-title>. <source>Nucleic Acids Res.</source> <volume>36</volume>, <fpage>D93</fpage>&#x2013;<lpage>D96</lpage>. doi: <pub-id pub-id-type="doi">10.1093/nar/gkm910</pub-id>, PMID: <pub-id pub-id-type="pmid">17962296</pub-id></citation></ref>
<ref id="ref43"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Soberanes-Guti&#x00E9;rrez</surname> <given-names>C. V.</given-names></name> <name><surname>P&#x00E9;rez-Rueda</surname> <given-names>E.</given-names></name> <name><surname>Ru&#x00ED;z-Herrera</surname> <given-names>J.</given-names></name> <name><surname>Gal&#x00E1;n-V&#x00E1;squez</surname> <given-names>E.</given-names></name></person-group> (<year>2021</year>). <article-title>Identifying Genes Devoted to the Cell Death Process in the Gene Regulatory Network of <italic>Ustilago maydis</italic></article-title>. <source>Front. Microbiol.</source> <volume>12</volume>:<fpage>680290</fpage>. doi: <pub-id pub-id-type="doi">10.3389/fmicb.2021.680290</pub-id>, PMID: <pub-id pub-id-type="pmid">34093501</pub-id></citation></ref>
<ref id="ref44"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Song</surname> <given-names>Q.</given-names></name> <name><surname>Grene</surname> <given-names>R.</given-names></name> <name><surname>Heath</surname> <given-names>L. S.</given-names></name> <name><surname>Li</surname> <given-names>S.</given-names></name></person-group> (<year>2017</year>). <article-title>Identification of regulatory modules in genome scale transcription regulatory networks</article-title>. <source>BMC Syst. Biol.</source> <volume>11</volume>:<fpage>140</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12918-017-0493-2</pub-id>, PMID: <pub-id pub-id-type="pmid">29246163</pub-id></citation></ref>
<ref id="ref45"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sueda</surname> <given-names>R.</given-names></name> <name><surname>Yoshida</surname> <given-names>K.</given-names></name> <name><surname>Onodera</surname> <given-names>M.</given-names></name> <name><surname>Fukui</surname> <given-names>T.</given-names></name> <name><surname>Yatsunami</surname> <given-names>R.</given-names></name> <name><surname>Nakamura</surname> <given-names>S.</given-names></name></person-group> (<year>2021</year>). <article-title>Characterization of a GlgC homolog from extremely halophilic archaeon <italic>Haloarcula japonica</italic></article-title>. <source>Biosci. Biotechnol. Biochem.</source> <volume>85</volume>, <fpage>1441</fpage>&#x2013;<lpage>1447</lpage>. doi: <pub-id pub-id-type="doi">10.1093/bbb/zbab050</pub-id>, PMID: <pub-id pub-id-type="pmid">33749776</pub-id></citation></ref>
<ref id="ref46"><citation citation-type="journal"><person-group person-group-type="author"><collab id="coll1">The DREAM5 Consortium</collab> <name><surname>Marbach</surname> <given-names>D.</given-names></name> <name><surname>Costello</surname> <given-names>J. C.</given-names></name> <name><surname>K&#x00FC;ffner</surname> <given-names>R.</given-names></name> <name><surname>Vega</surname> <given-names>N. M.</given-names></name> <name><surname>Prill</surname> <given-names>R. J.</given-names></name> <etal/></person-group>. (<year>2012</year>). <article-title>Wisdom of crowds for robust gene network inference</article-title>. <source>Nat. Methods</source> <volume>9</volume>, <fpage>796</fpage>&#x2013;<lpage>804</lpage>. doi: <pub-id pub-id-type="doi">10.1038/nmeth.2016</pub-id>, PMID: <pub-id pub-id-type="pmid">22796662</pub-id></citation></ref>
<ref id="ref47"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Virtanen</surname> <given-names>P.</given-names></name> <name><surname>Gommers</surname> <given-names>R.</given-names></name> <name><surname>Oliphant</surname> <given-names>T. E.</given-names></name> <name><surname>Haberland</surname> <given-names>M.</given-names></name> <name><surname>Reddy</surname> <given-names>T.</given-names></name> <name><surname>Cournapeau</surname> <given-names>D.</given-names></name> <collab>SciPy 1.0 Contributors</collab> <etal/></person-group>. (<year>2020</year>). <article-title>SciPy 1.0: fundamental algorithms for scientific computing in Python</article-title>. <source>Nat. Methods</source> <volume>17</volume>, <fpage>261</fpage>&#x2013;<lpage>272</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41592-019-0686-2</pub-id>, PMID: <pub-id pub-id-type="pmid">32015543</pub-id></citation></ref>
<ref id="ref48"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yu</surname> <given-names>H.</given-names></name> <name><surname>Luscombe</surname> <given-names>N. M.</given-names></name> <name><surname>Lu</surname> <given-names>H. X.</given-names></name> <name><surname>Zhu</surname> <given-names>X.</given-names></name> <name><surname>Xia</surname> <given-names>Y.</given-names></name> <name><surname>Han</surname> <given-names>J. D.</given-names></name> <etal/></person-group>. (<year>2004</year>). <article-title>Annotation transfer between genomes: protein-protein interologs and protein-DNA regulogs</article-title>. <source>Genome Res.</source> <volume>14</volume>, <fpage>1107</fpage>&#x2013;<lpage>1118</lpage>. doi: <pub-id pub-id-type="doi">10.1101/gr.1774904</pub-id>, PMID: <pub-id pub-id-type="pmid">15173116</pub-id></citation></ref>
<ref id="ref49"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>P.</given-names></name> <name><surname>Ye</surname> <given-names>Z.</given-names></name> <name><surname>Ye</surname> <given-names>C.</given-names></name> <name><surname>Zou</surname> <given-names>H.</given-names></name> <name><surname>Gao</surname> <given-names>Z.</given-names></name> <name><surname>Pan</surname> <given-names>J.</given-names></name></person-group> (<year>2020</year>). <article-title>OmpW is positively regulated by iron via Fur, and negatively regulated by SoxS contribution to oxidative stress resistance in <italic>Escherichia coli</italic></article-title>. <source>Microb. Pathog.</source> <volume>138</volume>:<fpage>103808</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.micpath.2019.103808</pub-id>, PMID: <pub-id pub-id-type="pmid">31634530</pub-id></citation></ref>
</ref-list>
<fn-group>
<fn id="fn0004">
<p><sup>1</sup><ext-link xlink:href="https://dbtbs.hgc.jp" ext-link-type="uri">https://dbtbs.hgc.jp</ext-link></p>
</fn>
<fn id="fn0005">
<p><sup>2</sup><ext-link xlink:href="http://regulondb.ccg.unam.mx" ext-link-type="uri">http://regulondb.ccg.unam.mx</ext-link></p>
</fn>
<fn id="fn0006">
<p><sup>3</sup><ext-link xlink:href="http://www.regulome.pcyt.unam.mx" ext-link-type="uri">http://www.regulome.pcyt.unam.mx</ext-link></p>
</fn>
<fn id="fn0007">
<p><sup>4</sup><ext-link xlink:href="http://uniprot.org" ext-link-type="uri">http://uniprot.org</ext-link></p>
</fn>
</fn-group>
</back>
</article>