<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Mol. Biosci.</journal-id>
<journal-title>Frontiers in Molecular Biosciences</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Mol. Biosci.</abbrev-journal-title>
<issn pub-type="epub">2296-889X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1223830</article-id>
<article-id pub-id-type="doi">10.3389/fmolb.2023.1223830</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Molecular Biosciences</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Are there double knots in proteins? Prediction and <italic>in vitro</italic> verification based on TrmD-Tm1570 fusion from <italic>C. nitroreducens</italic>
</article-title>
<alt-title alt-title-type="left-running-head">Perlinska et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/fmolb.2023.1223830">10.3389/fmolb.2023.1223830</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Perlinska</surname>
<given-names>Agata P.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2525741/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Nguyen</surname>
<given-names>Mai Lan</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2313465/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Pilla</surname>
<given-names>Smita P.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Staszor</surname>
<given-names>Emilia</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2315002/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Lewandowska</surname>
<given-names>Iwona</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Bernat</surname>
<given-names>Agata</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Purta</surname>
<given-names>El&#x17c;bieta</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Augustyniak</surname>
<given-names>Rafal</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1591129/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Bujnicki</surname>
<given-names>Janusz M.</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Sulkowska</surname>
<given-names>Joanna I.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Centre of New Technologies</institution>, <institution>University of Warsaw</institution>, <addr-line>Warsaw</addr-line>, <country>Poland</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Polish-Japanese Academy of Information Technology</institution>, <addr-line>Warsaw</addr-line>, <country>Poland</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Faculty of Chemistry</institution>, <institution>University of Warsaw</institution>, <addr-line>Warsaw</addr-line>, <country>Poland</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Laboratory of Bioinformatics and Protein Engineering</institution>, <institution>International Institute of Molecular and Cell Biology in Warsaw</institution>, <addr-line>Warsaw</addr-line>, <country>Poland</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/132812/overview">Piero Andrea Temussi</ext-link>, University of Naples Federico II, Italy</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1110572/overview">Adam Liwo</ext-link>, University of Gdansk, Poland</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/154539/overview">Peter Virnau</ext-link>, Johannes Gutenberg University Mainz, Germany</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Joanna I. Sulkowska, <email>jsulkowska@cent.uw.edu.pl</email>
</corresp>
</author-notes>
<pub-date pub-type="epub">
<day>06</day>
<month>06</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2023</year>
</pub-date>
<volume>10</volume>
<elocation-id>1223830</elocation-id>
<history>
<date date-type="received">
<day>16</day>
<month>05</month>
<year>2023</year>
</date>
<date date-type="accepted">
<day>04</day>
<month>10</month>
<year>2023</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2024 Perlinska, Nguyen, Pilla, Staszor, Lewandowska, Bernat, Purta, Augustyniak, Bujnicki and Sulkowska.</copyright-statement>
<copyright-year>2024</copyright-year>
<copyright-holder>Perlinska, Nguyen, Pilla, Staszor, Lewandowska, Bernat, Purta, Augustyniak, Bujnicki and Sulkowska</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>We have been aware of the existence of knotted proteins for over 30 years&#x2014;but it is hard to predict what is the most complicated knot that can be formed in proteins. Here, we show new and the most complex knotted topologies recorded to date&#x2014;double trefoil knots (3<sub>1</sub>
<italic>&#x23;</italic>3<sub>1</sub>). We found five domain arrangements (architectures) that result in a doubly knotted structure in almost a thousand proteins. The double knot topology is found in knotted membrane proteins from the CaCA family, that function as ion transporters, in the group of carbonic anhydrases that catalyze the hydration of carbon dioxide, and in the proteins from the SPOUT superfamily that gathers 3<sub>1</sub> knotted methyltransferases with the active site-forming knot. For each family, we predict the presence of a double knot using AlphaFold and RoseTTaFold structure prediction. In the case of the TrmD-Tm1570 protein, which is a member of SPOUT superfamily, we show that it folds <italic>in vitro</italic> and is biologically active. Our results show that this protein forms a homodimeric structure and retains the ability to modify tRNA, which is the function of the single-domain TrmD protein. However, how the protein folds and is degraded remains unknown.</p>
</abstract>
<kwd-group>
<kwd>methyltransferase</kwd>
<kwd>composite knot</kwd>
<kwd>SPOUT</kwd>
<kwd>domain</kwd>
<kwd>evolution</kwd>
</kwd-group>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Structural Biology</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1">
<title>1 Introduction</title>
<p>The presence of knots in proteins has been known for almost 30 years, but only a few types of knots were identified over the years: 3<sub>1</sub>, 4<sub>1</sub>, 5<sub>2</sub>, and 6<sub>1</sub> (<xref ref-type="bibr" rid="B20">Eriksson et al., 1988</xref>; <xref ref-type="bibr" rid="B54">Taylor, 2000</xref>; <xref ref-type="bibr" rid="B59">Wagner et al., 2005</xref>; <xref ref-type="bibr" rid="B17">Das et al., 2006</xref>; <xref ref-type="bibr" rid="B51">Schmidberger et al., 2008</xref>; <xref ref-type="bibr" rid="B5">B&#xf6;linger et al., 2010</xref>; <xref ref-type="bibr" rid="B56">Thiruselvam et al., 2017</xref>; <xref ref-type="bibr" rid="B53">Sulkowska, 2020</xref>). The most commonly encountered knot is the trefoil (3<sub>1</sub>), which is found in more than 85% of knotted structures. However, the number of knotted proteins is not high (185) which makes up about 0.3% of all the proteins with structures deposited in the PDB database (<xref ref-type="bibr" rid="B27">Jamroz et al., 2015</xref>). This raises at least two fundamental questions. First, why is the number of knotted proteins so low, even though it is expected from polymer physics to be much higher (<xref ref-type="bibr" rid="B35">Lua and Grosberg 2006</xref>)? It could be due to the complicated folding process needed to form the knot, including threading, which is energetically costly (<xref ref-type="bibr" rid="B62">Yeates et al., 2007</xref>), or maybe entanglement is disadvantageous in the process of protein degradation. However, since knotted domains frequently contain binding sites for substrates (<xref ref-type="bibr" rid="B53">Sulkowska, 2020</xref>), their presence is essential for certain proteins, such as methyltransferases (MTs) (<xref ref-type="bibr" rid="B57">Tkaczuk et al., 2007</xref>; <xref ref-type="bibr" rid="B9">Christian et al., 2016</xref>; <xref ref-type="bibr" rid="B47">Perlinska et al., 2020b</xref>). The second question is why proteins can only form simple types of knots? Why not more complex knots with more crossings or multiple separate knots since multi-domain proteins do exist? Both questions are not trivial to answer. Herein, we will try to solve the second one.</p>
<p>In this paper, we expand our knowledge of protein structure complexity and possible folds by presenting newly identified families of proteins with two separate knots (a so-called composite knot; <xref ref-type="table" rid="T1">Table 1</xref>). For each family, we determined the structures of doubly knotted proteins using AlphaFold 2 and RoseTTaFold (<xref ref-type="fig" rid="F1">Figure 1</xref>), and in the case of one family (TrmD-Tm1570), we performed a more in-depth <italic>in silico</italic> and <italic>in vitro</italic> study based on <italic>Calditerrivibrio nitroreducens</italic>. All of the proteins with composite knots that we found have two 3<sub>1</sub> knots [based on AlphaKnot database (<xref ref-type="bibr" rid="B40">Niemyska et al., 2022</xref>)], which is expected by trefoil&#x2019;s prevalence in the knotted proteins world (<xref ref-type="bibr" rid="B15">Dabrowski-Tumanski et al., 2019</xref>). In our search, we have not identified any other structures involving two sequential knots, other than two trefoils. However, just as the single-knotted proteins, the composite knots are also not commonly found in a proteome, but the scale is different&#x2014;a well-studied knotted MT called tRNA methyltransferase D (TrmD) is a universal protein for all Bacteria (<xref ref-type="bibr" rid="B26">Ito et al., 2015</xref>; <xref ref-type="bibr" rid="B63">Zhong et al., 2019</xref>), but the presence of proteins with composite knots is limited to specific organisms, such as <italic>Desulfovibrio vulgaris</italic> or <italic>Oleidesulfovibrio alaskensis</italic>.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Proteins with composite knots.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Superfamily</th>
<th align="center">Fusion architecture (Pfam ID)</th>
<th align="center">No. proteins</th>
<th align="center">Example protein (UniProtKB ID)</th>
<th align="right">Knot type</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Carbonic anhydrase</td>
<td align="center">PF00194-PF00194</td>
<td align="center">686</td>
<td align="center">A0A0B7AKD5</td>
<td align="right">3<sub>1</sub>
<italic>&#x23;</italic>3<sub>1</sub>
</td>
</tr>
<tr>
<td align="left">CaCA</td>
<td align="center">PF01699-PF01699-PF01699-PF01699</td>
<td align="center">24</td>
<td align="center">A0A179I9N9</td>
<td align="right">3<sub>1</sub>
<italic>&#x23;</italic>3<sub>1</sub>
</td>
</tr>
<tr>
<td align="left">SPOUT</td>
<td align="center">PF00588-PF00588</td>
<td align="center">125</td>
<td align="center">Q4DMW6</td>
<td align="right">3<sub>1</sub>
<italic>&#x23;</italic>3<sub>1</sub>
</td>
</tr>
<tr>
<td align="left">SPOUT (Nep1-Nep1)</td>
<td align="center">PF03587-PF03587</td>
<td align="center">34</td>
<td align="center">A0A498KD62</td>
<td align="right">3<sub>1</sub>
<italic>&#x23;</italic>3<sub>1</sub>
</td>
</tr>
<tr>
<td align="left">SPOUT (TrmD-Tm1570)</td>
<td align="center">PF01746-PF09936</td>
<td align="center">66</td>
<td align="center">E4THH1</td>
<td align="right">3<sub>1</sub>
<italic>&#x23;</italic>3<sub>1</sub>
</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>The majority of the proteins with composite knots represent the SPOUT superfamily, although in most cases the recognition of specific proteins behind that architecture was not possible. Reported Pfam IDs are of entangled domains.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Predicted single chain structures of the fusion proteins. <bold>(A)</bold> Carbonic anhydrase (PF00194-PF00194; UniProtKB ID: A0A0B7AKD5) <bold>(B)</bold> Protein from Ca<sup>2&#x2b;</sup>: Cation Antiporter (CaCA) family (UniProtKB ID: A0A0L0BYW8). <bold>(C)</bold> Protein with PF00588-PF00588 architecture (UniProtKB ID: Q4DMW6). <bold>(D)</bold> Nep1-Nep1 protein (PF03587-PF03587 architecture; UniProtKB ID: A0A498KD62). <bold>(E)</bold> TrmD-Tm1570 protein (PF01746-PF09936 architecture; UniProtKB ID: E4THH1). All the models were predicted with AlphaFold 2. Knotted regions are shown with rainbow coloring and their reduced structures were obtained with Knot_pull package (<xref ref-type="bibr" rid="B28">Jarmolinska et al., 2020</xref>).</p>
</caption>
<graphic xlink:href="fmolb-10-1223830-g001.tif"/>
</fig>
<p>Thus we showed that proteins can adopt more complex structures. So, the rarity of knotted proteins might be connected with their complex topology and folding pathway. The knots in proteins (with determined 3D structure) identified to date are exclusively of twist type (<xref ref-type="bibr" rid="B15">Dabrowski-Tumanski et al., 2019</xref>), which means that the rate-limiting threading during protein folding occurs only once (<xref ref-type="bibr" rid="B55">Taylor, 2007</xref>; <xref ref-type="bibr" rid="B62">Yeates et al., 2007</xref>; <xref ref-type="bibr" rid="B5">B&#xf6;linger et al., 2010</xref>; <xref ref-type="bibr" rid="B53">Sulkowska, 2020</xref>). With structures containing two knots (regardless of their type), the threading must happen at least twice, which is a substantial energetic cost for the cell. Therefore, doubly knotted proteins may provide additional benefits over single-knotted proteins to be advantageous for the cell (<xref ref-type="bibr" rid="B16">Dabrowski-Tumanski et al., 2016b</xref>; <xref ref-type="bibr" rid="B53">Sulkowska, 2020</xref>). This advantage might be connected to the reason for many other proteins fusing together&#x2014;these proteins are interacting and forming functional complexes while remaining separate (<xref ref-type="bibr" rid="B8">Chia and Kolatkar, 2004</xref>; <xref ref-type="bibr" rid="B43">Pasek et al., 2006</xref>; <xref ref-type="bibr" rid="B7">Buljan et al., 2010</xref>; <xref ref-type="bibr" rid="B37">Marsh et al., 2013</xref>). Thus, when their genes are nearby or are fused, they can be expressed together (both in time and place), which is energetically favorable.</p>
<p>Herein, having discussed the general characteristics of four of the five doubly knot families, we focus on one family of doubly knotted proteins&#x2014;a TrmD-Tm1570 fusion, which joins two domains with MT activity. Both of the domains function also as single proteins (<xref ref-type="bibr" rid="B57">Tkaczuk et al., 2007</xref>; <xref ref-type="bibr" rid="B32">Kim et al., 2009</xref>; <xref ref-type="bibr" rid="B44">Perlinska et al., 2020a</xref>). To better understand the structure, evolution and biological function of this fusion on doubly knotted TrmD-Tm1570 from <italic>C. nitroreducens</italic> (<italic>Cn</italic>TrmD-Tm1570), we conducted an <italic>in vitro</italic> study of this protein&#x2019;s activity and an extensive bioinformatics analysis of sequences and structures of its related proteins. Our results show that the <italic>Cn</italic>TrmD-Tm1570 protein is a functional homodimeric protein that methylates tRNA, and thus the <italic>Cn</italic>TrmD domain is fully operational (<xref ref-type="bibr" rid="B9">Christian et al., 2016</xref>). However, the function of the second domain (<italic>Cn</italic>Tm1570) is not clear except that it is similar to 2&#x2019;O ribose-modifying knotted MTs (<xref ref-type="bibr" rid="B32">Kim et al., 2009</xref>). Moreover, how the double knotted proteins fold, and whether they can be easily degraded are going to be new open fundamental questions.</p>
</sec>
<sec sec-type="materials|methods" id="s2">
<title>2 Materials and methods</title>
<sec id="s2-1">
<title>2.1 Search for double knotted proteins</title>
<p>First, we obtained information about domains found in entangled protein structures from the KnotProt database (<xref ref-type="bibr" rid="B15">Dabrowski-Tumanski et al., 2019</xref>). Next, we calculated the minimal length of each domain, which was based on the shortest knotted region of the domain. This step was important for finding proteins long enough to be doubly knotted. The implicated domains were classified into three groups based on their contribution in creating a knot, slipknot, or both. We then retrieved all the sequences present in the Pfam database (<xref ref-type="bibr" rid="B38">Mistry et al., 2021</xref>), which consisted of at least two entangled functional regions, and created a list of proteins divided by their domain architecture. We selected the proteins with the highest possibility of containing a composite knot. From each domain architecture type, we chose a few sequences (also regarding their length). We considered representative proteins to form a composite knot when their closest homolog with a known 3D structure contained at least one entanglement. Therefore, we identified the most similar sequences within the AlphaFold Protein Structure Database using the Basic Local Alignment Search Tool (BLAST) in ChimeraX 1.3 (<xref ref-type="bibr" rid="B48">Pettersen et al., 2021</xref>). The best hit was checked based on its e-value and presence in the entanglements. If the e-value was significant (<italic>e</italic> &#x2212; <italic>value</italic> &#x3c; 10<sup>&#x2013;3</sup>) and the homolog turned out to be knotted, the examined protein was modeled in AlphaFold 2. It is worth noting that all found homologs had e-values between 1e-07 and 0.0 (with most being between 1e-30 and 0.0). Obtained structures were additionally analyzed using the AlphaKnot server.</p>
</sec>
<sec id="s2-2">
<title>2.2 Dataset preparation and quantification of dimer interfaces</title>
<p>The PDB (<xref ref-type="bibr" rid="B4">Berman et al., 2000</xref>) was scanned for entries representing TrmD as well as Tm1570 in different source organisms with a resolution better than 4.0&#xa0;&#xc5;. We identified the pairwise interactions and quantified the interface area (B) using the following equation:<disp-formula id="e1">
<mml:math id="m1">
<mml:mi>B</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mi>S</mml:mi>
<mml:mi>A</mml:mi>
<mml:mi>S</mml:mi>
<mml:msub>
<mml:mrow>
<mml:mi>A</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>S</mml:mi>
<mml:mi>A</mml:mi>
<mml:mi>S</mml:mi>
<mml:msub>
<mml:mrow>
<mml:mi>A</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>S</mml:mi>
<mml:mi>A</mml:mi>
<mml:mi>S</mml:mi>
<mml:msub>
<mml:mrow>
<mml:mi>A</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>12</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>.</mml:mo>
</mml:math>
<label>(1)</label>
</disp-formula>Here, the first two terms represent the solvent accessible surface area (SASA) of the molecules in isolated form and the last term represents the SASA of their binary complex. SASA values were calculated using the program NACCESS (<xref ref-type="bibr" rid="B25">Hubbard and Thornton, 1993</xref>), which implements the Lee and Richards algorithm (<xref ref-type="bibr" rid="B33">Lee and Richards, 1971</xref>).</p>
</sec>
<sec id="s2-3">
<title>2.3 Sequence analysis</title>
<p>The sequences of fusion proteins were retrieved from the UniProt Knowledge base (UniProtKB) (<xref ref-type="bibr" rid="B11">Consortium, 2021</xref>), by searching for both protein families of TrmD (Pfam id: PF01746) and Tm1570 (PF09936) proteins. Then the sequences were clustered using the CD-HIT suite (<xref ref-type="bibr" rid="B24">Huang et al., 2010</xref>) (three runs, with sequence identity cutoff ranges from 0.9 to 0.7). Multiple sequence alignment was done using Clustal Omega (<xref ref-type="bibr" rid="B36">Madeira et al., 2022</xref>) and the conservation of residues was analyzed using UGENE (<xref ref-type="bibr" rid="B42">Okonechnikov et al., 2012</xref>).</p>
</sec>
<sec id="s2-4">
<title>2.4 Molecular docking</title>
<p>The tRNA from <italic>Haemophilus influenzae</italic> (<italic>Hi</italic>TrmD) (PDB id: 4YVI) was extracted and docked to the TrmD domain of the fusion protein with known constraint (tRNA binding motif) using the HDOCK server (<xref ref-type="bibr" rid="B61">Yan et al., 2017</xref>). The C<italic>&#x3b1;</italic> root mean square deviation (RMSD) to the PDB structure 4YVI was used to filter the fusion-tRNA complexes, and the best superposed complex was chosen for further study. Following that, four ligands (S-adenosylmethionine; SAM) were docked to the respective knotted domains of TrmD and Tm1570 in the fusion-tRNA protein-RNA complex using the GLIDE program in the Schr&#x151;dinger software (Maestro 12.5). The fusion-tRNA structure was prepared using the Protein Preparation Wizard. Prior to docking to Tm1570 we added a water molecule, which based on Tm1570 crystals, is important for a proper pose of SAM. We also rotated the side chain of Asn409 accordingly to Tm1570 crystal structures and minimized the protein, in order for the residue not to block the binding site. Docking to Tm1570 was performed with H-bond constraints defined on the amine group of Ala357 and the backbone oxygens of Ile402 and Asn409.</p>
</sec>
<sec id="s2-5">
<title>2.5 Structure prediction with AlphaFold and RoseTTaFold cross-validation</title>
<p>Structures were predicted with our locally installed newest AlphaFold 2 version (2.1.0). Proteins with potential composite knots based on the AlphaFold 2 calculations were validated on the RoseTTaFold server (<xref ref-type="bibr" rid="B2">Baek et al., 2021</xref>) using default parameters. Since RoseTTaFold does not accept sequences with more than 1,200 residues, the larger proteins were modeled within this range. All the modelled structures were deposited in the Github repository (<ext-link ext-link-type="uri" xlink:href="https://github.com/ilbsm/Double_knots_structures/tree/main">https://github.com/ilbsm/Double_knots_structures/tree/main</ext-link>).</p>
</sec>
<sec id="s2-6">
<title>2.6 Experimental procedures</title>
<p>Codon-optimized gene coding for TrmD-Tm1570 was synthesized (GenArt, Thermo Scientific) and inserted into the pET28b expression vector. Transformed <italic>E. coli</italic> BL21 (DE3) RIL cells were grown at 37&#xb0;C until OD<sub>600</sub> reached 0.8. After induction with 1&#xa0;mM IPTG the temperature was decreased to 18&#xb0;C and bacteria were harvested 18&#xa0;h later. The cell pellet was resuspended in a lysis buffer containing 6&#xa0;M urea, 20&#xa0;mM Hepes, 300&#xa0;mM NaCl, 10&#xa0;mM imidazole and 0,01% NaN3. The protein was purified in a HisTrap HP 5&#xa0;mL column (GE Healthcare). After elution, the protein was dialyzed for at least 5&#xa0;h against 2&#xa0;L of buffer (50&#xa0;mM Hepes, 300&#xa0;mM NaCl, 20% glycerol, 0.01% NaN3, 2&#xa0;mM DTT, pH 7.4) in each concentration of urea containing 2&#xa0;M, 1&#xa0;M, 0.8 M, 0.6 M, 0&#xa0;M (5 different buffers). The final purification step involved a preparative Superdex 75 column with the running buffer containing 50&#xa0;mM Hepes, 300&#xa0;mM NaCl, 10% glycerol, 1&#xa0;mM TCEP, pH 7.4. The pure protein was flash-frozen in liquid nitrogen and stored at &#x2212;80&#xb0;C. Activity assays were performed with the MTase-Glo kit (Promega) according to the manufacturer&#x2019;s instructions. The luminescence was performed on a Synergy H1 plate reader (Biotek). Further details are given in SI Materials and Methods.</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>3 Results</title>
<p>Our search for composite knots in proteins is based on two approaches, with direct and indirect use of available protein structures. The indirect approach is focused on the protein sequence and domain annotation. We use the KnotProt database (<xref ref-type="bibr" rid="B15">Dabrowski-Tumanski et al., 2019</xref>) and the information it contains about knotted proteins along with the location of the knot in their structures. We associate the presence of a knot with the domain in which it is located. With this data, we searched for multi-domain proteins with more than one entangled domain. For this purpose, we use the Pfam database that contains protein domains grouped into families and superfamilies. This resulted in finding five domain architectures that could possess double knots (<xref ref-type="table" rid="T1">Table 1</xref>).</p>
<p>In our second approach, we analyze the available protein structures directly. Thanks to the ever-growing number of predicted models with the machine learning methods like AlphaFold (<xref ref-type="bibr" rid="B31">Jumper et al., 2021</xref>; <xref ref-type="bibr" rid="B58">Varadi et al., 2022</xref>) and our AlphaKnot database that analyses their topology (<xref ref-type="bibr" rid="B40">Niemyska et al., 2022</xref>), we were able to find proteins with double knots based on their 3D structure. In order to minimize the probability of finding artifacts, we used only models predicted with high confidence (pLDDT score). We did not encounter any other fusion architectures but found seven additional proteins for the PF00588-PF00588 architecture, that we already found with the first method (<xref ref-type="table" rid="T1">Table 1</xref>).</p>
<p>Finally, we used locally installed AlphaFold 2 (original model; 2.1.0) to predict the structures of selected proteins (at least two members from each family). Moreover, for additional verification, we used RoseTTaFold to predict structures for the same protein sequences and compare their topologies. The example doubly knotted protein from each of the architectures is presented in <xref ref-type="fig" rid="F1">Figure 1</xref> and <xref ref-type="table" rid="T1">Table 1</xref>. The other proteins with predicted doubly knotted structures are shown in the <xref ref-type="sec" rid="s10">Supplementary Table S1</xref>).</p>
<p>All of the architectures we found represent composite 3<sub>1</sub>
<italic>&#x23;</italic>3<sub>1</sub> knots, which is expected since the trefoil (3<sub>1</sub>) knot is the most common knot type found in proteins. As anticipated, the majority of the architectures are formed by domains from the SPOUT superfamily since it is the biggest group of deeply knotted 3<sub>1</sub> proteins (<xref ref-type="bibr" rid="B53">Sulkowska, 2020</xref>). Moreover, we found composite knots also within membrane proteins, namely, the ion transporters.</p>
<sec id="s3-1">
<title>3.1 Carbonic anhydrases</title>
<p>A substantial number of composite knots is found within carbonic anhydrases (<xref ref-type="bibr" rid="B64">Sayre et al., 2011</xref>; <xref ref-type="bibr" rid="B65">Dzubiella, 2013</xref>). This is a well-known group of knotted proteins with many structures resolved experimentally. Most of these enzymes have a single domain (PF00194) that contains either a deep or a shallow 3<sub>1</sub> knot (human carbonic anhydrase IX and II, respectively). The fusion of two such domains results in a double 3<sub>1</sub> knotted protein, with a knot encompassing most of the structure (<xref ref-type="fig" rid="F1">Figure 1A</xref>). We found this architecture (PF00194-PF00194) in 686 protein sequences (131 AlphaFold models with 3<sub>1</sub>
<italic>&#x23;</italic>3<sub>1</sub> can be found in the AlphaKnot database. The difference in the number may be due to the fact that several sequences may be too short to form double knot). Importantly, carbonic anhydrases can form disulfide bridges. These bridges can be formed both within a single chain, thereby creating a lasso that stabilizes a shallow knot (<xref ref-type="bibr" rid="B13">Dabrowski-Tumanski et al. 2016a</xref>; <xref ref-type="bibr" rid="B41">Niewieczerza&#x142; and Sulkowska 2019</xref>; <xref ref-type="bibr" rid="B39">Niemyska et al., 2020</xref>). They can also be formed between the monomers forming a dimer (<xref ref-type="bibr" rid="B1">Alterio et al. 2009</xref>; <xref ref-type="bibr" rid="B18">De Simone and Supuran 2010</xref>).</p>
</sec>
<sec id="s3-2">
<title>3.2 The Ca<sup>2&#x2b;</sup>: Cation Antiporter (CaCA) family&#x2014;transmembrane protein</title>
<p>This family of membrane transporters already contains known knotted proteins, such as Vacuolar cation/proton exchanger (CAX) with a 3<sub>1</sub> knot (<xref ref-type="bibr" rid="B29">Jarmolinska et al., 2019</xref>). This protein has two PF01699 domains that together form a knot. Here, we found proteins with four such domains which indicate that they could possess two knots within their structure. This architecture (PF01699-PF01699-PF01699-PF01699) is present in 24 proteins (<xref ref-type="table" rid="T1">Table 1</xref>) and none of them has a resolved structure. <xref ref-type="fig" rid="F1">Figure 1B</xref> shows a structure we predicted with AlphaFold (RoseTTaFold also predicted two knots in this protein). Other proteins from this group with the potential to be doubly knotted are listed in the supplement (<xref ref-type="sec" rid="s10">Supplementary Table S1</xref>).</p>
</sec>
<sec id="s3-3">
<title>3.3 The SPOUT family</title>
<p>Apart from the TrmD-Tm1570 proteins that we describe in more detail below, the SPOUT family contains at least two different architectures also forming a composite 3<sub>1</sub>
<italic>&#x23;</italic>3<sub>1</sub> knot (<xref ref-type="table" rid="T1">Table 1</xref>). Most probably they are a result of gene duplication&#x2014;the gene coding the knot-containing domain fused with its duplicate resulting in a double knotted protein. Individual SPOUT families (Pfam ID) shown in <xref ref-type="table" rid="T1">Table 1</xref> represent the MT domain, which functions as a single protein in many organisms (<xref ref-type="bibr" rid="B23">Hou et al., 2017</xref>). The common structural feature among all of the structures we predicted is the fact that the duplicated domains are interacting <italic>via</italic> the vast interface (<xref ref-type="fig" rid="F1">Figures 1C, D</xref>). Furthermore, the arrangement of the domains is identical to that formed by single-domain proteins in their homodimeric complex (<xref ref-type="sec" rid="s10">Supplementary Figure S1</xref>).</p>
<sec id="s3-3-1">
<title>3.3.1 PF00588-PF00588&#x2014;the largest group of doubly knotted proteins</title>
<p>The PF00588 is a large protein family with over 35,000 sequences of MTs modifying 2&#x2019;O of ribose in either tRNA or rRNA. The PF00588-PF00588 fusion proteins form the biggest group of the doubly knotted proteins we found. Interestingly, we encountered proteins with this architecture using domain annotations in Pfam (118 hits) and structure searches in AlphaKnot (seven hits). Since these seven proteins do not have both domains annotated in the Pfam database, we used HHpred to obtain them (<xref ref-type="sec" rid="s10">Supplementary Table S2</xref>).</p>
<p>Both domains of this architecture contain a compact 3<sub>1</sub> knot, which is characteristic of the SPOUT superfamily. All seven models look like a fused dimeric complex of a knotted MT (<xref ref-type="fig" rid="F1">Figure 1C</xref>; <xref ref-type="sec" rid="s10">Supplementary Figure S1</xref>) with the domains arranged in a perpendicular fashion, for example, in TrmH (from the same family) or Tm1570 (from PF09936 family) crystal structures (<xref ref-type="bibr" rid="B32">Kim et al., 2009</xref>).</p>
</sec>
<sec id="s3-3-2">
<title>3.3.2 PF03587-PF03587&#x2014;Nep1-Nep1 fusion</title>
<p>There are 34 proteins with the double knot topology and PF03587-PF03587 domain architecture. The PF03587 family groups Ribosomal RNA small subunit MTs NEP1 (Nep1) that methylate pseudouridine at position 1,189 (Psi1189) in 18S rRNA. Most of these proteins function as homodimeric single-domain proteins. The predicted structure of Nep1-Nep1 fusion we found (<xref ref-type="fig" rid="F1">Figure 1D</xref>) resembles the crystal structure of Nep1 dimeric complex (<xref ref-type="sec" rid="s10">Supplementary Figure S1</xref>)&#x2014;similar as in the case of PF00588-PF00588 proteins.</p>
</sec>
<sec id="s3-3-3">
<title>3.3.3 PF01746-PF09936&#x2014;TrmD-Tm1570 fusion</title>
<p>The next group of doubly knotted proteins is formed by the PF01746-PF09936 architecture with both families found within SPOUT knotted MTs. There are a couple of crucial differences between these proteins and the other SPOUT fusions we discussed above: 1) the evolutionary mechanism does not involve gene duplication, 2) in a single chain the two domains interact using a minimal interface, 3) TrmD-Tm1570 is a homodimer, whereas the aforementioned fusion proteins can function as monomers. All of these points are discussed in detail in the sections below.</p>
<p>There are 66 proteins with the PF01746-PF09936 annotation in Pfam and all are present in Bacteria. Within the PF01746 family, there is a well-studied TrmD protein (<xref ref-type="bibr" rid="B26">Ito et al., 2015</xref>) that modifies the N1 position of G37 in tRNA. It is a universal bacterial protein that in a vast majority of organisms is a single-domain protein. In the PF01746-PF09936 architecture, TrmD is fused with Tm1570.</p>
<p>The Tm1570 protein belongs to the SAM-dependent RNA MT family (Pfam ID: PF09936). It contains only 299 proteins and one of them, namely, Tm1570 from <italic>Thermotoga maritima</italic>, has been crystallized (PDB ID: 3dcm). Based on the structure similarity search we performed with Dali (<xref ref-type="bibr" rid="B22">Holm and Laakso, 2016</xref>) using the crystal structure, the protein is most similar to TrmJ MTs that modify cytidine 32&#xa0;at the 2&#x2019;O position in tRNA (<xref ref-type="bibr" rid="B50">Purta et al. 2006</xref>) (<xref ref-type="sec" rid="s10">Supplementary Table S3</xref>). Therefore, it is highly probable that proteins with the PF09936 domain bind tRNA and perform methylation of ribose 2&#x2019;O. Within the whole PF09936 family, two types of domain architecture can be found: a single-domain protein (like Tm1570) or a two-domain protein, which is the TrmD-Tm1570 fusion.</p>
<p>By analyzing the location of the genes coding the domains of both families (Pfam ID: PF01746 and PF09936) in Bacteria, we found four different ways in which the genes are co-located in the genomes: 1) two single genes in different parts of the genome; 2) two single genes adjacent on the genome; 3) two single but overlapping genes; 4) one fused gene. <xref ref-type="fig" rid="F2">Figure 2</xref> shows the arrangement in some example organisms. This might represent the evolutionary pathway that led to the creation of the fusion, which started as two separate genes. Even though we did not find evidence supporting the interaction between single-domain TrmD and Tm1570, we hypothesize that the proteins can form a complex and it was more advantageous for the cell to express them, and in the end to fuse them, together.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Arrangement of TrmD and Tm1570 genes in different organisms. From the top: <italic>Aquifex aeolicus</italic>&#x2014;the genes are separated by thousands of nucleotides; <italic>Desulfobacter postgatei</italic>&#x2014;the genes are 11 nucleotides apart; <italic>Thermotoga maritima</italic>&#x2014;the genes are overlapping by 7 nucleotides; <italic>Calditerrivibrio nitroreducens</italic>&#x2014;the genes are fused.</p>
</caption>
<graphic xlink:href="fmolb-10-1223830-g002.tif"/>
</fig>
<p>Next, to verify the presence of the two knots in these proteins, we predicted their structures from nine different organisms (see <xref ref-type="sec" rid="s10">Supplementary Figure S2</xref>) using AlphaFold 2. None of the nine formed a compact single chain structure as is the case in the other families of double knotted proteins from SPOUT superfamily we analyzed (e.g., Nep1-Nep1; <xref ref-type="fig" rid="F1">Figure 1B</xref>). Instead, the nine form an open conformation with the domains scarcely interacting with each other (<xref ref-type="fig" rid="F1">Figure 1E</xref>). This behavior is expected since the two proteins in their single-domain forms are dimerizing in different ways: TrmD in an antiparallel fashion and Tm1570 in a perpendicular fashion (<xref ref-type="fig" rid="F3">Figure 3</xref>). This suggests that TrmD-Tm1570 functions as a dimer and the domains interact with their counterparts from the other chain.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Predicted structure of CnTrmD-Tm1570 fusion protein based on AlphaFold and docking. This homodimeric (second chain is transparent) complex binds tRNA (green) with its TrmD domains. A single chain of this protein contains two 3<sub>1</sub> knots (marked in blue and red) (<xref ref-type="bibr" rid="B40">Niemyska et al. 2022</xref>). TrmD domain (light grey) interacts with its counterpart from the second chain in an antiparallel fashion, whereas Tm1570 (dark grey) in a perpendicular fashion. Details about the modeled complex are in the <xref ref-type="sec" rid="s2">Methods section</xref>.</p>
</caption>
<graphic xlink:href="fmolb-10-1223830-g003.tif"/>
</fig>
</sec>
</sec>
<sec id="s3-4">
<title>3.4 TrmD-Tm1570 from <italic>Calditerrivibrio nitroreducens</italic>
</title>
<sec id="s3-4-1">
<title>3.4.1 Homodimeric structure</title>
<p>From the set of double knotted proteins we found, we investigated further one from the TrmD-Tm1570 family from <italic>Calditerrivibrio nitroreducens</italic> (<italic>Cn</italic>TrmD-Tm1570). We used this protein to characterize the structural basis for substrate recognition and the overall structural landscape of double knotted proteins.</p>
<p>Our theoretical and experimental analysis shows that the <italic>Cn</italic>TrmD-Tm1570 protein functions as a homodimer, unlike other double knotted proteins we study here. Therefore, we used AlphaFold Multimer to model the structure and obtained a compact homodimeric complex (<xref ref-type="fig" rid="F3">Figure 3</xref>) with the main interchain interactions present between the corresponding domains. Both of the domains interact in a standard fashion (antiparallel for TrmD and perpendicular for Tm1570) with their counterparts from the other chain. To further verify the model we analyzed the dimeric interface of the fusion and compared it with the ones that are created in single-domain TrmDs and Tm1570s. We analyzed all TrmD and Tm1570 structures available in the PDB along with their homologs (<xref ref-type="sec" rid="s10">Supplementary Table S4</xref>) and found key residues that are crucial for the dimeric interface in the single-domain proteins (the sequence similarity between different TrmD proteins is low, although, the structures can be superimposed very well). These amino acids are conserved in both the TrmD and Tm1570 domains of the fusion (<xref ref-type="fig" rid="F4">Figure 4</xref>; <xref ref-type="sec" rid="s10">Supplementary Tables S5, S6</xref>).</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Comparison of sequence motifs in TrmD and Tm1570 with the fusion protein. WebLogo3 was used to construct the conserved residue logos at the SAM and tRNA binding sites. Cartoon representation shows the TrmD-Tm1570 protein (TrmD domain in green, Tm1570 in blue) with selected motifs marked on the structure.</p>
</caption>
<graphic xlink:href="fmolb-10-1223830-g004.tif"/>
</fig>
<p>Details concerning the mechanism of function, including conformations of the residues in the active site as well as the steps of chemical catalysis, are well understood for TrmD (single-domain proteins) but not for Tm1570. Herein, based on our analysis of structure and sequence, we found that deep trefoil knots provide the binding sites for SAM in both the TrmD and Tm1570 domains of the fusion. Moreover, they are both structurally and sequentially similar to their counterparts from single-domain proteins (<xref ref-type="fig" rid="F4">Figure 4</xref>). Thus the ligand binding modes should be similar in both domains. More precisely, the binding site-forming knot in <italic>Haemophilus influenzae</italic> TrmD (<italic>Hi</italic>TrmD) consists of three loops: the cover (Ser88-Gly91), the wall (Gly113-Ile118), and the bottom loop (Ser132-Gly140) (<xref ref-type="bibr" rid="B30">Jaroensuk et al., 2019</xref>). The residues of the corresponding three loops in the fusion protein are conserved (the cover loop: Asp87-Gly90, the wall: Gly112- Ile117, and the bottom: Ser131-Gly139). The residues Pro88, Gly90, Arg113, Glu115, Gly116, Ser131, Gly133 and Asp134 are strictly conserved and are involved in the TrmD dimeric interactions (<xref ref-type="sec" rid="s10">Supplementary Table S6</xref>). We used this information to obtain the complex of TrmD-Tm1570 with SAM <italic>via</italic> molecular docking. The resulting structure has four SAM molecules (one ligand in one of the four available active sites), each adopting a conformation that is proper and characteristic for the SPOUT superfamily (<xref ref-type="bibr" rid="B47">Perlinska et al., 2020b</xref>) (<xref ref-type="sec" rid="s10">Supplementary Figure S3</xref>).</p>
<p>Finally, based on the known binding mode of tRNA to <italic>Hi</italic>TrmD, we established how the nucleic acid may interact with the <italic>Cn</italic>TrmD-Tm1570 dimer. We found that residues involved in <italic>Hi</italic>TrmD-tRNA interactions are also involved in the fusion (<xref ref-type="fig" rid="F4">Figure 4</xref>). The SGHH motif (residues 198&#x2013;201 in <italic>Hi</italic>TrmD) that interacts with G37 in the substrate tRNAs for the methylation process (<xref ref-type="bibr" rid="B26">Ito et al., 2015</xref>) is present in SGNH form in the <italic>C. nitroreducens</italic> fusion. All of this information strongly suggests that the predicted model correctly demonstrates how the active complex of TrmD-Tm1570 is constructed.</p>
</sec>
<sec id="s3-4-2">
<title>3.4.2 TrmD-Tm1570 is an active tRNA methyltransferase</title>
<p>In order to experimentally assess the activity of the fusion TrmD-Tm1570 from <italic>C. nitroreducens</italic>, we expressed the His-tagged protein in <italic>E. coli</italic> cells. However, the full-length protein, as well as its individual truncated domains encompassing residues 1&#x2013;240 (TrmD) and 241&#x2013;433 (Tm1570) (see <xref ref-type="fig" rid="F5">Figure 5A</xref>), was found in the insoluble fractions even when growing bacteria at low temperatures. Nevertheless, we managed to perform purification under denaturing conditions and obtained large quantities of structured and functional proteins after the final refolding step. Size-exclusion chromatography suggests that all fragments form stable dimers given the retention volumes on the preparative Superdex 75 column (GE Healthcare; <xref ref-type="sec" rid="s10">Supplementary Figure S4</xref>): 56&#xa0;mL for the fusion TrmD-Tm1570 (49.6&#xa0;kDa monomer), 63&#xa0;mL for the TrmD (27.5&#xa0;kDa monomer), and 65&#xa0;mL for the Tm1570 domain (22.1&#xa0;kDa monomer). It is noteworthy that the single-domain <italic>Ec</italic>TrmD (28.4&#xa0;kDa monomer), which was previously characterized as a dimer (<xref ref-type="bibr" rid="B19">Elkins et al., 2003</xref>) and was now expressed for the sake of reference, eluted from the same column at 63&#xa0;mL. Moreover, we were able to obtain small quantities of the soluble Tm1570 protein without unfolding procedures and this protein migrated through the gel filtration column as Tm1570 subjected to <italic>in vitro</italic> renaturation.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Activity of CnTrmD-Tm1570. <bold>(A)</bold> Protein constructs used for the activity assessment. <bold>(B)</bold> Time-course of the reaction catalyzed by fusion TrmD-Tm1570 (50&#xa0;nM) in the presence of SAM (30&#xa0;<italic>&#x3bc;</italic>M) towards the 8&#xa0;<italic>&#x3bc;</italic>M tRNA Leu (CAG) substrate (<italic>E. coli</italic> tRNA black triangles, <italic>C. nitroreducens</italic> tRNA black circles). <bold>(C)</bold> Relative activities of different TrmD-Tm1570 constructs. Data obtained for the mutated tRNA substrate and negative control are also included. Reaction conditions are the same as in <bold>(B)</bold>.</p>
</caption>
<graphic xlink:href="fmolb-10-1223830-g005.tif"/>
</fig>
<p>We tested the MT activity of the recombinant TrmD-Tm1570 using the commercially available MTase-Glo kit (Promega), which allows one to monitor the S-Adenosyl-L-homocysteine (SAH) concentration build-up during the enzymatic reaction. First, we used tRNA Leu (CAG) from <italic>E. coli</italic> (see <xref ref-type="sec" rid="s10">Supplementary Figure S5</xref> for exact sequence) as the acceptor of the methyl moiety. It turned out that <italic>Cn</italic>TrmD-Tm1570 fusion protein was able to efficiently modify this cloverleaf structure in the presence of SAM. However, as seen in <xref ref-type="fig" rid="F5">Figure 5B</xref>, the same reaction was almost two times faster when the native <italic>C. nitroreducens</italic> substrate, homologous to <italic>E. coli</italic> tRNA Leu (CAG), was used (see <xref ref-type="sec" rid="s10">Supplementary Figure S5</xref>). Although the key nucleotides, including the G37G38 motif, are conserved in both tRNA sequences, not surprisingly TrmD-Tm1570 shows preference towards its native substrate, originating from the same organism as the protein. To verify the importance of the aforementioned G37G38 motif for the reaction catalyzed by TrmD-Tm1570 we also prepared a mutant of <italic>C. nitroreducens</italic> tRNA Leu (CAG), where the guanosine at position 37 was replaced by thymine at the level of the DNA template. As expected for this substrate, the double knotted enzyme showed no activity, comparable to the negative control lacking SAM in the reaction mixture. The activity towards the mutated substrate is higher (at least twice) than control (<xref ref-type="fig" rid="F5">Figure 5C</xref>).</p>
<p>Since we wanted to examine the contribution of both domains to the overall activity of the fusion TrmD-Tm1570 protein, we followed the reaction catalyzed by truncated versions of the full-length protein. With respect to the native <italic>C. nitroreducens</italic> tRNA Leu (CAG) substrate, the TrmD domain retained 86% &#xb1; 4% activity of the fusion protein, while Tm1570 retained only 18% &#xb1; 9% (see <xref ref-type="fig" rid="F5">Figure 5C</xref>). These data clearly demonstrate that the enzymatic activity of the fusion TrmD-Tm1570 protein towards tRNA Leu (CAG) substrate is governed by the TrmD domain. However, the Tm1570 domain may contribute to substrate binding and increase the stability of the complex. On the other hand, small activity of the isolated Tm1570, comparable to the negative control which had SAM omitted from the reaction mixture, may suggest that this protein, whose physiological function remains unknown, is a tRNA methyltransferase but with different substrate specificity. It is also possible that Tm1570 regains its full activity in the presence of a specific ligand or under yet-to-be-discovered conditions.</p>
</sec>
</sec>
</sec>
<sec sec-type="conclusion" id="s4">
<title>4 Conclusion</title>
<p>Answering the question from the title: yes, proteins with double knots do exist. Here, for the first time we found and analyzed in-depth such proteins. All of them have two 3<sub>1</sub> knots and come from three different protein superfamilies (five distinct architectures). They are either transmembrane ion transporters (from the <italic>Ca</italic>
<sup>2&#x2b;</sup>: Cation Antiporter family), carbonic anhydrases, or methyltransferases (from the SPOUT family). Within the SPOUT group, there are three architectures in proteins with either two duplicated domains (PF00588-PF00588 and PF03587-PF03587) or two separate domains (PF01746-PF09936&#x2014;TrmD-Tm1570). We found that these two groups differ in terms of structure organization&#x2014;the duplicated and fused domains form dimer-like single chain structures, whereas the TrmD-Tm1570 proteins need two chains to resemble a functional SPOUT MT (which are mostly dimers).</p>
<p>Using both theoretical and experimental approaches we studied in detail TrmD-Tm1570&#x2014;a fusion between TrmD and Tm1570 proteins found in 66 organisms. Based on <italic>C. nitroreducens</italic> we established that the protein is a homodimer capable of binding four ligands (S-adenosylmethionine)&#x2014;one in each knotted binding site, and a single tRNA molecule (based on the similarities with <italic>Hi</italic>TrmD). Moreover, the <italic>Cn</italic>TrmD-Tm1570 is folding and functioning <italic>in vitro</italic>&#x2014;it methylates tRNA using its TrmD domain. Unfortunately, we were not able to determine the function of the Tm1570 domain&#x2014;which is unknown for single-domain proteins as well. However, based on structural similarities, we believe that it also acts as a tRNA MT, probably by modifying 2&#x2019;O in ribose. During the preparation of this manuscript, we were able to solve experimentally the structure of <italic>Cn</italic>TrmD-Tm1570 protein and deposit it in the PDB (PDB id: 8b1n) (<xref ref-type="bibr" rid="B12">da Silva et al., 2023</xref>). Our model and the crystal structure are similar, in particular, both of them show &#x201c;open&#x201d; domain organization that enables homodimer formation.</p>
<p>Herein, we have identified proteins with knotted 3<sub>1</sub>
<italic>&#x23;</italic>3<sub>1</sub> structure, composed of two sequential trefoils. A natural question is whether more complicated composite knots also exist in nature. In our search we have not identified any other more complicated sequential pairs (involving other knots than two trefoils). However, another hypothetically possible (albeit quite unlikely) structure involves one trefoil knot formed within another trefoil. Identification of such a structure would require much more sophisticated search; if such a structure exists, it would very likely have even more complex functional properties. Another method would need to be employed to find such a structure, because the methods used in this research are specific to the case of sequential trefoils.</p>
<p>Note that our research was conducted based on the sequences of all known knotted proteins (domains) (<xref ref-type="bibr" rid="B15">Dabrowski-Tumanski et al., 2019</xref>), including predicted knotted proteins (<xref ref-type="bibr" rid="B45">Perlinska et al., 2023</xref>) based on the results of AlphaFold 2 till the end of June 2022. During the preparation of this manuscript, a paper by <xref ref-type="bibr" rid="B6">Brems et al. (2022)</xref> was published showing the composite knots in AlphaFold structures of SPOUT methyltransferases and carbonic anhydrases. Moreover, given that new primary knots are being identified in structures predicted by AlphaFold <xref ref-type="bibr" rid="B40">Niemyska et al. (2022)</xref>, we predict that different types of composite knots exist in nature, and their identification is an important task for future research.</p>
<p>Finally, let us comment on folding of proteins with 3<sub>1</sub>
<italic>&#x23;</italic>3<sub>1</sub> knots. Based on known folding pathways of proteins from SPOUT family one could imagine knotting the N-terminal chain directly on the ribosome (<xref ref-type="bibr" rid="B10">Chwastyk and Cieplak, 2015</xref>; <xref ref-type="bibr" rid="B14">Dabrowski-Tumanski et al., 2018</xref>; <xref ref-type="bibr" rid="B3">Baiesi et al., 2019</xref>), while the C-terminal knot could follow a well known slipknot pathway (<xref ref-type="bibr" rid="B60">Wallin et al., 2007</xref>; <xref ref-type="bibr" rid="B52">Sulkowska et al., 2009</xref>) or other mechanisms suggested for proteins with a deep knot based on numerical simulations (<xref ref-type="bibr" rid="B49">Potestio et al., 2010</xref>; <xref ref-type="bibr" rid="B34">Li et al., 2012</xref>). Another possibility is to use flipping mechanism observed in numerical simulations for proteins with, e.g., 6<sub>1</sub> knot (<xref ref-type="bibr" rid="B5">B&#xf6;linger et al., 2010</xref>). This mechanism was later developed to a topological descriptor of knot folding by <xref ref-type="bibr" rid="B21">Flapan et al. (2019)</xref>. One could extend this scenario to explain folding of newly identified proteins with no-twist types of knots, such as 6<sub>3</sub> recently predicted based on AlphaFold approach (<xref ref-type="bibr" rid="B46">Perlinska et al., 2022</xref>). However, it is not clear how to use it directly to 3<sub>1</sub>
<italic>&#x23;</italic>3<sub>1</sub> knots; moreover, in the case of all doubly knotted proteins listed in this work, we do not see loops responsible for flipping. Reconstructing a folding pathway of composite knots is also an important task for future research.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s5">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/<xref ref-type="sec" rid="s10">Supplementary Material</xref>, further inquiries can be directed to the corresponding author.</p>
</sec>
<sec id="s6">
<title>Author contributions</title>
<p>AP and JS: investigation and writing&#x2014;original manuscript. AP and MN: formal analysis, methodology, validation, visualization, and writing&#x2014;review and editing. SP: formal analysis, investigation. ES, IL, AB: conducting experimental investigation. AB, EP, and JB: editing of the revised manuscript. RA: conceptualization, data curation and writing&#x2014;original manuscript. JB and EP: conceptualization of experimental part. JS: conceptualization, data curation, formal analysis, investigation, methodology, project administration, resources, supervision, validation, visualization, and writing&#x2014;review and editing. All authors contributed to the article and approved the submitted version.</p>
</sec>
<sec id="s7">
<title>Funding</title>
<p>This work was supported by the National Science Centre &#x23;UMO-2018/31/B/NZ1/04016, 2020/39/I/NZ1/03582 and 2021/43/I/NZ1/03341 to JS.</p>
</sec>
<ack>
<p>This research was carried out with the support of the Interdisciplinary Centre for Mathematical and Computational Modelling, University of Warsaw under computational allocation no GS82-12 and COST EUTOPIA action.</p>
</ack>
<sec sec-type="COI-statement" id="s8">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s9">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s10">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fmolb.2023.1223830/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fmolb.2023.1223830/full&#x23;supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="DataSheet1.pdf" id="SM1" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alterio</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Hilvo</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Di Fiore</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Supuran</surname>
<given-names>C. T.</given-names>
</name>
<name>
<surname>Pan</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Parkkila</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2009</year>). <article-title>Crystal structure of the catalytic domain of the tumor-associated human carbonic anhydrase ix</article-title>. <source>Proc. Natl. Acad. Sci.</source> <volume>106</volume>, <fpage>16233</fpage>&#x2013;<lpage>16238</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.0908301106</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Baek</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>DiMaio</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Anishchenko</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Dauparas</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Ovchinnikov</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>G. R.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Accurate prediction of protein structures and interactions using a three-track neural network</article-title>. <source>Science</source> <volume>373</volume>, <fpage>871</fpage>&#x2013;<lpage>876</lpage>. <pub-id pub-id-type="doi">10.1126/science.abj8754</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Baiesi</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Orlandini</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Seno</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Trovato</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Sequence and structural patterns detected in entangled proteins reveal the importance of co-translational folding</article-title>. <source>Sci. Rep.</source> <volume>9</volume>, <fpage>8426</fpage>&#x2013;<lpage>8512</lpage>. <pub-id pub-id-type="doi">10.1038/s41598-019-44928-3</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Berman</surname>
<given-names>H. M.</given-names>
</name>
<name>
<surname>Westbrook</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Feng</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Gilliland</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Bhat</surname>
<given-names>T. N.</given-names>
</name>
<name>
<surname>Weissig</surname>
<given-names>H.</given-names>
</name>
<etal/>
</person-group> (<year>2000</year>). <article-title>The protein data bank</article-title>. <source>Nucleic Acids Res.</source> <volume>28</volume>, <fpage>235</fpage>&#x2013;<lpage>242</lpage>. <pub-id pub-id-type="doi">10.1093/nar/28.1.235</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>B&#xf6;linger</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Su&#x142;kowska</surname>
<given-names>J. I.</given-names>
</name>
<name>
<surname>Hsu</surname>
<given-names>H.-P.</given-names>
</name>
<name>
<surname>Mirny</surname>
<given-names>L. A.</given-names>
</name>
<name>
<surname>Kardar</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Onuchic</surname>
<given-names>J. N.</given-names>
</name>
<etal/>
</person-group> (<year>2010</year>). <article-title>A Stevedore&#x2019;s protein knot</article-title>. <source>PLoS Comput. Biol.</source> <volume>6</volume>, <fpage>e1000731</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pcbi.1000731</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Brems</surname>
<given-names>M. A.</given-names>
</name>
<name>
<surname>Runkel</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Yeates</surname>
<given-names>T. O.</given-names>
</name>
<name>
<surname>Virnau</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>AlphaFold predicts the most complex protein knot and composite protein knots</article-title>. <source>Protein Sci.</source> <volume>31</volume>, <fpage>e4380</fpage>. <pub-id pub-id-type="doi">10.1002/pro.4380</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Buljan</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Frankish</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Bateman</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Quantifying the mechanisms of domain gain in animal proteins</article-title>. <source>Genome Biol.</source> <volume>11</volume>, <fpage>R74</fpage>&#x2013;<lpage>R15</lpage>. <pub-id pub-id-type="doi">10.1186/gb-2010-11-7-r74</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chia</surname>
<given-names>J.-M.</given-names>
</name>
<name>
<surname>Kolatkar</surname>
<given-names>P. R.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Implications for domain fusion protein-protein interactions based on structural information</article-title>. <source>BMC Bioinforma.</source> <volume>5</volume>, <fpage>161</fpage>&#x2013;<lpage>167</lpage>. <pub-id pub-id-type="doi">10.1186/1471-2105-5-161</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Christian</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Sakaguchi</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Perlinska</surname>
<given-names>A. P.</given-names>
</name>
<name>
<surname>Lahoud</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Ito</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Taylor</surname>
<given-names>E. A.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Methyl transfer by substrate signaling from a knotted protein fold</article-title>. <source>Nat. Struct. Mol. Biol.</source> <volume>23</volume>, <fpage>941</fpage>&#x2013;<lpage>948</lpage>. <pub-id pub-id-type="doi">10.1038/nsmb.3282</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chwastyk</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Cieplak</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Cotranslational folding of deeply knotted proteins</article-title>. <source>J. Phys. Condens. Matter</source> <volume>27</volume>, <fpage>354105</fpage>. <pub-id pub-id-type="doi">10.1088/0953-8984/27/35/354105</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Consortium</surname>
<given-names>T. U.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>UniProt: the universal protein knowledgebase in 2021</article-title>. <source>Nucleic Acids Res.</source> <volume>49</volume>, <fpage>D480</fpage>&#x2013;<lpage>D489</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkaa1100</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="web">
<person-group person-group-type="author">
<name>
<surname>da Silva</surname>
<given-names>F. B.</given-names>
</name>
<name>
<surname>Lewandowska</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Kluza</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Niewieczerzal</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Augustyniak</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Sulkowska</surname>
<given-names>J. I.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>First crystal structure of double knotted protein TrmD-Tm1570 &#x2013; inside from degradation perspective</article-title>. <comment>bioRxiv</comment>. <comment>Available at: <ext-link ext-link-type="uri" xlink:href="https://www.biorxiv.org/content/10.1101/2023.03.13.532328v1">https://www.biorxiv.org/content/10.1101/2023.03.13.532328v1</ext-link>.</comment>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dabrowski-Tumanski</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Niemyska</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Pasznik</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Sulkowska</surname>
<given-names>J. I.</given-names>
</name>
</person-group> (<year>2016a</year>). <article-title>Lassoprot: server to analyze biopolymers with lassos</article-title>. <source>Nucleic acids Res.</source> <volume>44</volume>, <fpage>W383</fpage>&#x2013;<lpage>W389</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkw308</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dabrowski-Tumanski</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Piejko</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Niewieczerzal</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Stasiak</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Sulkowska</surname>
<given-names>J. I.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Protein knotting by active threading of nascent polypeptide chain exiting from the ribosome exit channel</article-title>. <source>J. Phys. Chem. B</source> <volume>122</volume>, <fpage>11616</fpage>&#x2013;<lpage>11625</lpage>. <pub-id pub-id-type="doi">10.1021/acs.jpcb.8b07634</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dabrowski-Tumanski</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Rubach</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Goundaroulis</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Dorier</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Su&#x142;kowski</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Millett</surname>
<given-names>K. C.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>KnotProt 2.0: a database of proteins with knots and other entangled structures</article-title>. <source>Nucleic Acids Res.</source> <volume>47</volume>, <fpage>D367</fpage>&#x2013;<lpage>D375</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gky1140</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dabrowski-Tumanski</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Stasiak</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Sulkowska</surname>
<given-names>J. I.</given-names>
</name>
</person-group> (<year>2016b</year>). <article-title>In search of functional advantages of knots in proteins</article-title>. <source>PloS One</source> <volume>11</volume>, <fpage>e0165986</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0165986</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Das</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Hoang</surname>
<given-names>Q. Q.</given-names>
</name>
<name>
<surname>Kreinbring</surname>
<given-names>C. A.</given-names>
</name>
<name>
<surname>Luchansky</surname>
<given-names>S. J.</given-names>
</name>
<name>
<surname>Meray</surname>
<given-names>R. K.</given-names>
</name>
<name>
<surname>Ray</surname>
<given-names>S. S.</given-names>
</name>
<etal/>
</person-group> (<year>2006</year>). <article-title>Structural basis for conformational plasticity of the Parkinson&#x2019;s disease-associated ubiquitin hydrolase uch-l1</article-title>. <source>Proc. Natl. Acad. Sci.</source> <volume>103</volume>, <fpage>4675</fpage>&#x2013;<lpage>4680</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.0510403103</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>De Simone</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Supuran</surname>
<given-names>C. T.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Carbonic anhydrase ix: biochemical and crystallographic characterization of a novel antitumor target</article-title>. <source>Biochimica Biophysica Acta (BBA)-Proteins Proteomics</source> <volume>1804</volume>, <fpage>404</fpage>&#x2013;<lpage>409</lpage>. <pub-id pub-id-type="doi">10.1016/j.bbapap.2009.07.027</pub-id>
</citation>
</ref>
<ref id="B65">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dzubiella</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Tightening and Untying the Knot in Human Carbonic Anhydrase III</article-title>. <source>J. Phys. Chem. Lett.</source> <volume>4</volume> (<issue>11</issue>), <fpage>1829</fpage>&#x2013;<lpage>1833</lpage>. <pub-id pub-id-type="doi">10.1021/jz400748b</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Elkins</surname>
<given-names>P. A.</given-names>
</name>
<name>
<surname>Watts</surname>
<given-names>J. M.</given-names>
</name>
<name>
<surname>Zalacain</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>van Thiel</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Vitazka</surname>
<given-names>P. R.</given-names>
</name>
<name>
<surname>Redlak</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2003</year>). <article-title>Insights into catalysis by a knotted TrmD tRNA methyltransferase</article-title>. <source>J. Mol. Biol.</source> <volume>333</volume>, <fpage>931</fpage>&#x2013;<lpage>949</lpage>. <pub-id pub-id-type="doi">10.1016/j.jmb.2003.09.011</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Eriksson</surname>
<given-names>A. E.</given-names>
</name>
<name>
<surname>Jones</surname>
<given-names>T. A.</given-names>
</name>
<name>
<surname>Liljas</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>1988</year>). <article-title>Refined structure of human carbonic anhydrase ii at 2.0 &#xe5; resolution</article-title>. <source>Proteins Struct. Funct. Bioinforma.</source> <volume>4</volume>, <fpage>274</fpage>&#x2013;<lpage>282</lpage>. <pub-id pub-id-type="doi">10.1002/prot.340040406</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Flapan</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Wong</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Topological descriptions of protein folding</article-title>. <source>Proc. Natl. Acad. Sci.</source> <volume>116</volume>, <fpage>9360</fpage>&#x2013;<lpage>9369</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1808312116</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Holm</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Laakso</surname>
<given-names>L. M.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Dali server update</article-title>. <source>Nucleic Acids Res.</source> <volume>44</volume>, <fpage>W351</fpage>&#x2013;<lpage>W355</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkw357</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hou</surname>
<given-names>Y.-M.</given-names>
</name>
<name>
<surname>Matsubara</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Takase</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Masuda</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Sulkowska</surname>
<given-names>J. I.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>TrmD: a methyl transferase for tRNA methylation with m1G37</article-title>. <source>Enzym.</source> <volume>41</volume>, <fpage>89</fpage>&#x2013;<lpage>115</lpage>. <pub-id pub-id-type="doi">10.1016/bs.enz.2017.03.003</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Niu</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Gao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Fu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>W.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>CD-HIT Suite: a web server for clustering and comparing biological sequences</article-title>. <source>Bioinformatics</source> <volume>26</volume>, <fpage>680</fpage>&#x2013;<lpage>682</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btq003</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Hubbard</surname>
<given-names>S. J.</given-names>
</name>
<name>
<surname>Thornton</surname>
<given-names>J. M.</given-names>
</name>
</person-group> (<year>1993</year>). <source>Naccess. Computer program</source>. <publisher-loc>London</publisher-loc>: <publisher-name>Department of Biochemistry and Molecular Biology, University College</publisher-name>.</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ito</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Masuda</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Yoshida</surname>
<given-names>K.-i.</given-names>
</name>
<name>
<surname>Goto-Ito</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Sekine</surname>
<given-names>S.-i.</given-names>
</name>
<name>
<surname>Suh</surname>
<given-names>S. W.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Structural basis for methyl-donor&#x2013;dependent and sequence-specific binding to tRNA substrates by knotted methyltransferase TrmD</article-title>. <source>Proc. Natl. Acad. Sci.</source> <volume>112</volume>, <fpage>E4197</fpage>&#x2013;<lpage>E4205</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1422981112</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jamroz</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Niemyska</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Rawdon</surname>
<given-names>E. J.</given-names>
</name>
<name>
<surname>Stasiak</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Millett</surname>
<given-names>K. C.</given-names>
</name>
<name>
<surname>Su&#x142;kowski</surname>
<given-names>P.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>KnotProt: a database of proteins with knots and slipknots</article-title>. <source>Nucleic Acids Res.</source> <volume>43</volume>, <fpage>D306</fpage>&#x2013;<lpage>D314</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gku1059</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jarmolinska</surname>
<given-names>A. I.</given-names>
</name>
<name>
<surname>Gambin</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Sulkowska</surname>
<given-names>J. I.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Knot_pull&#x2014;python package for biopolymer smoothing and knot detection</article-title>. <source>Bioinformatics</source> <volume>36</volume>, <fpage>953</fpage>&#x2013;<lpage>955</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btz644</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jarmolinska</surname>
<given-names>A. I.</given-names>
</name>
<name>
<surname>Perlinska</surname>
<given-names>A. P.</given-names>
</name>
<name>
<surname>Runkel</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Trefz</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Ginn</surname>
<given-names>H. M.</given-names>
</name>
<name>
<surname>Virnau</surname>
<given-names>P.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Proteins&#x2019; knotty problems</article-title>. <source>J. Mol. Biol.</source> <volume>431</volume>, <fpage>244</fpage>&#x2013;<lpage>257</lpage>. <pub-id pub-id-type="doi">10.1016/j.jmb.2018.10.012</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jaroensuk</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wong</surname>
<given-names>Y. H.</given-names>
</name>
<name>
<surname>Zhong</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Liew</surname>
<given-names>C. W.</given-names>
</name>
<name>
<surname>Maenpuen</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Sahili</surname>
<given-names>A. E.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Crystal structure and catalytic mechanism of the essential m1G37 tRNA methyltransferase TrmD from <italic>Pseudomonas aeruginosa</italic>
</article-title>. <source>RNA</source> <volume>25</volume>, <fpage>1481</fpage>&#x2013;<lpage>1496</lpage>. <pub-id pub-id-type="doi">10.1261/rna.066746.118</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jumper</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Evans</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Pritzel</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Green</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Figurnov</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ronneberger</surname>
<given-names>O.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Highly accurate protein structure prediction with AlphaFold</article-title>. <source>Nature</source> <volume>596</volume>, <fpage>583</fpage>&#x2013;<lpage>589</lpage>. <pub-id pub-id-type="doi">10.1038/s41586-021-03819-2</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname>
<given-names>D. J.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>H. S.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>S. J.</given-names>
</name>
<name>
<surname>Suh</surname>
<given-names>S. W.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Crystal structure of Thermotoga maritima SPOUT superfamily RNA methyltransferase Tm1570 in complex with S-adenosyl-L-methionine</article-title>. <source>Proteins Struct. Funct. Bioinforma.</source> <volume>74</volume>, <fpage>245</fpage>&#x2013;<lpage>249</lpage>. <pub-id pub-id-type="doi">10.1002/prot.22249</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lee</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Richards</surname>
<given-names>F. M.</given-names>
</name>
</person-group> (<year>1971</year>). <article-title>The interpretation of protein structures: estimation of static accessibility</article-title>. <source>J. Mol. Biol.</source> <volume>55</volume>, <fpage>379</fpage>&#x2013;<lpage>400</lpage>. <pub-id pub-id-type="doi">10.1016/0022-2836(71)90324-x</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Terakawa</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Takada</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Energy landscape and multiroute folding of topologically complex proteins adenylate kinase and 2ouf-knot</article-title>. <source>Proc. Natl. Acad. Sci.</source> <volume>109</volume>, <fpage>17789</fpage>&#x2013;<lpage>17794</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1201807109</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lua</surname>
<given-names>R. C.</given-names>
</name>
<name>
<surname>Grosberg</surname>
<given-names>A. Y.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>Statistics of knots, geometry of conformations, and evolution of proteins</article-title>. <source>PLoS Comput. Biol.</source> <volume>2</volume>, <fpage>e45</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pcbi.0020045</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Madeira</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Pearce</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Tivey</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Basutkar</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Edbali</surname>
<given-names>O.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Search and sequence analysis tools services from EMBL-EBI in 2022</article-title>. <source>Nucleic Acids Res.</source> <volume>50</volume>, <fpage>W276</fpage>&#x2013;<lpage>W279</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkac240</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Marsh</surname>
<given-names>J. A.</given-names>
</name>
<name>
<surname>Hern&#xe1;ndez</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Hall</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Ahnert</surname>
<given-names>S. E.</given-names>
</name>
<name>
<surname>Perica</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Robinson</surname>
<given-names>C. V.</given-names>
</name>
<etal/>
</person-group> (<year>2013</year>). <article-title>Protein complexes are under evolutionary selection to assemble via ordered pathways</article-title>. <source>Cell</source> <volume>153</volume>, <fpage>461</fpage>&#x2013;<lpage>470</lpage>. <pub-id pub-id-type="doi">10.1016/j.cell.2013.02.044</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mistry</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Chuguransky</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Williams</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Qureshi</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Salazar</surname>
<given-names>G. A.</given-names>
</name>
<name>
<surname>Sonnhammer</surname>
<given-names>E. L.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Pfam: the protein families database in 2021</article-title>. <source>Nucleic Acids Res.</source> <volume>49</volume>, <fpage>D412</fpage>&#x2013;<lpage>D419</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkaa913</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Niemyska</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Millett</surname>
<given-names>K. C.</given-names>
</name>
<name>
<surname>Sulkowska</surname>
<given-names>J. I.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Gln: a method to reveal unique properties of lasso type topology in proteins</article-title>. <source>Sci. Rep.</source> <volume>10</volume>, <fpage>15186</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-020-71874-2</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Niemyska</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Rubach</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Gren</surname>
<given-names>B. A.</given-names>
</name>
<name>
<surname>Nguyen</surname>
<given-names>M. L.</given-names>
</name>
<name>
<surname>Garstka</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Bruno da Silva</surname>
<given-names>F.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>AlphaKnot: server to analyze entanglement in structures predicted by AlphaFold methods</article-title>. <source>Nucleic Acids Res.</source> <volume>50</volume>, <fpage>W44</fpage>&#x2013;<lpage>W50</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkac388</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Niewieczerza&#x142;</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Sulkowska</surname>
<given-names>J. I.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Supercoiling in a protein increases its stability</article-title>. <source>Phys. Rev. Lett.</source> <volume>123</volume>, <fpage>138102</fpage>. <pub-id pub-id-type="doi">10.1103/PhysRevLett.123.138102</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Okonechnikov</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Golosova</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Fursov</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Team</surname>
<given-names>U.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Unipro UGENE: a unified bioinformatics toolkit</article-title>. <source>Bioinformatics</source> <volume>28</volume>, <fpage>1166</fpage>&#x2013;<lpage>1167</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/bts091</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pasek</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Risler</surname>
<given-names>J.-L.</given-names>
</name>
<name>
<surname>Br&#xe9;zellec</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>Gene fusion/fission is a major contributor to evolution of multi-domain bacterial proteins</article-title>. <source>Bioinformatics</source> <volume>22</volume>, <fpage>1418</fpage>&#x2013;<lpage>1423</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btl135</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Perlinska</surname>
<given-names>A. P.</given-names>
</name>
<name>
<surname>Kalek</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Christian</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Hou</surname>
<given-names>Y.-M.</given-names>
</name>
<name>
<surname>Sulkowska</surname>
<given-names>J. I.</given-names>
</name>
</person-group> (<year>2020a</year>). <article-title>Mg2&#x2b;-Dependent methyl transfer by a knotted protein: a molecular dynamics simulation and quantum mechanics study</article-title>. <source>ACS Catal.</source> <volume>10</volume>, <fpage>8058</fpage>&#x2013;<lpage>8068</lpage>. <pub-id pub-id-type="doi">10.1021/acscatal.0c00059</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Perlinska</surname>
<given-names>A. P.</given-names>
</name>
<name>
<surname>Niemyska</surname>
<given-names>W. H.</given-names>
</name>
<name>
<surname>Gren</surname>
<given-names>B. A.</given-names>
</name>
<name>
<surname>Bukowicki</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Nowakowski</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Rubach</surname>
<given-names>P.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>AlphaFold predicts novel human proteins with knots</article-title>. <source>Protein Sci.</source> <volume>32</volume>, <fpage>e4631</fpage>. <pub-id pub-id-type="doi">10.1002/pro.4631</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="web">
<person-group person-group-type="author">
<name>
<surname>Perlinska</surname>
<given-names>A. P.</given-names>
</name>
<name>
<surname>Niemyska</surname>
<given-names>W. H.</given-names>
</name>
<name>
<surname>Gren</surname>
<given-names>B. A.</given-names>
</name>
<name>
<surname>Rubach</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Sulkowska</surname>
<given-names>J. I.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>New 63 knot and other knots in human proteome from AlphaFold predictions</article-title>. <comment>bioRxiv</comment>. <comment>Available at: <ext-link ext-link-type="uri" xlink:href="https://www.biorxiv.org/content/10.1101/2021.12.30.474018v1">https://www.biorxiv.org/content/10.1101/2021.12.30.474018v1</ext-link>.</comment>
</citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Perlinska</surname>
<given-names>A. P.</given-names>
</name>
<name>
<surname>Stasiulewicz</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Nawrocka</surname>
<given-names>E. K.</given-names>
</name>
<name>
<surname>Kazimierczuk</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Setny</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Sulkowska</surname>
<given-names>J. I.</given-names>
</name>
</person-group> (<year>2020b</year>). <article-title>Restriction of S-adenosylmethionine conformational freedom by knotted protein binding sites</article-title>. <source>PLoS Comput. Biol.</source> <volume>16</volume>, <fpage>e1007904</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pcbi.1007904</pub-id>
</citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pettersen</surname>
<given-names>E. F.</given-names>
</name>
<name>
<surname>Goddard</surname>
<given-names>T. D.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>C. C.</given-names>
</name>
<name>
<surname>Meng</surname>
<given-names>E. C.</given-names>
</name>
<name>
<surname>Couch</surname>
<given-names>G. S.</given-names>
</name>
<name>
<surname>Croll</surname>
<given-names>T. I.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>UCSF ChimeraX: structure visualization for researchers, educators, and developers</article-title>. <source>Protein Sci.</source> <volume>30</volume>, <fpage>70</fpage>&#x2013;<lpage>82</lpage>. <pub-id pub-id-type="doi">10.1002/pro.3943</pub-id>
</citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Potestio</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Micheletti</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Orland</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Knotted vs. unknotted proteins: evidence of knot-promoting loops</article-title>. <source>PLoS Comput. Biol.</source> <volume>6</volume>, <fpage>e1000864</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pcbi.1000864</pub-id>
</citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Purta</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Van Vliet</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Tkaczuk</surname>
<given-names>K. L.</given-names>
</name>
<name>
<surname>Dunin-Horkawicz</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Mori</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Droogmans</surname>
<given-names>L.</given-names>
</name>
<etal/>
</person-group> (<year>2006</year>). <article-title>The yfhQ gene of <italic>Escherichia coli</italic> encodes a tRNA: cm32/Um32 methyltransferase</article-title>. <source>BMC Mol. Biol.</source> <volume>7</volume>, <fpage>23</fpage>&#x2013;<lpage>13</lpage>. <pub-id pub-id-type="doi">10.1186/1471-2199-7-23</pub-id>
</citation>
</ref>
<ref id="B64">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sayre</surname>
<given-names>T. C.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>T. M.</given-names>
</name>
<name>
<surname>King</surname>
<given-names>N. P.</given-names>
</name>
<name>
<surname>Yeates</surname>
<given-names>T. O.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Protein stabilization in a highly knotted protein polymer</article-title>. <source>Protein Eng. Des. Sel.: PEDS</source> <volume>24</volume> (<issue>8</issue>), <fpage>627</fpage>&#x2013;<lpage>630</lpage>. <pub-id pub-id-type="doi">10.1093/protein/gzr024</pub-id>
</citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Schmidberger</surname>
<given-names>J. W.</given-names>
</name>
<name>
<surname>Wilce</surname>
<given-names>J. A.</given-names>
</name>
<name>
<surname>Weightman</surname>
<given-names>A. J.</given-names>
</name>
<name>
<surname>Whisstock</surname>
<given-names>J. C.</given-names>
</name>
<name>
<surname>Wilce</surname>
<given-names>M. C.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>The crystal structure of dehi reveals a new <italic>&#x3b1;</italic>-haloacid dehalogenase fold and active-site mechanism</article-title>. <source>J. Mol. Biol.</source> <volume>378</volume>, <fpage>284</fpage>&#x2013;<lpage>294</lpage>. <pub-id pub-id-type="doi">10.1016/j.jmb.2008.02.035</pub-id>
</citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sulkowska</surname>
<given-names>J. I.</given-names>
</name>
<name>
<surname>Su&#x142;kowski</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Onuchic</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Dodging the crisis of folding proteins with knots</article-title>. <source>Proc. Natl. Acad. Sci.</source> <volume>106</volume>, <fpage>3119</fpage>&#x2013;<lpage>3124</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.0811147106</pub-id>
</citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sulkowska</surname>
<given-names>J. I.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>On folding of entangled proteins: knots, lassos, links and theta-curves</article-title>. <source>Curr. Opin. Struct. Biol.</source> <volume>1</volume>, <fpage>131</fpage>&#x2013;<lpage>141</lpage>. <pub-id pub-id-type="doi">10.1016/j.sbi.2020.01.007</pub-id>
</citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Taylor</surname>
<given-names>W. R.</given-names>
</name>
</person-group> (<year>2000</year>). <article-title>A deeply knotted protein structure and how it might fold</article-title>. <source>Nature</source> <volume>406</volume>, <fpage>916</fpage>&#x2013;<lpage>919</lpage>. <pub-id pub-id-type="doi">10.1038/35022623</pub-id>
</citation>
</ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Taylor</surname>
<given-names>W. R.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>Protein knots and fold complexity: some new twists</article-title>. <source>Comput. Biol. Chem.</source> <volume>31</volume>, <fpage>151</fpage>&#x2013;<lpage>162</lpage>. <pub-id pub-id-type="doi">10.1016/j.compbiolchem.2007.03.002</pub-id>
</citation>
</ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Thiruselvam</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Kumarevel</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Karthe</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Kuramitsu</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Yokoyama</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Ponnuswamy</surname>
<given-names>M. N.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Crystal structure analysis of a hypothetical protein (mj0366) from methanocaldococcus jannaschii revealed a novel topological arrangement of the knot fold</article-title>. <source>Biochem. Biophysical Res. Commun.</source> <volume>482</volume>, <fpage>264</fpage>&#x2013;<lpage>269</lpage>. <pub-id pub-id-type="doi">10.1016/j.bbrc.2016.11.052</pub-id>
</citation>
</ref>
<ref id="B57">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tkaczuk</surname>
<given-names>K. L.</given-names>
</name>
<name>
<surname>Dunin-Horkawicz</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Purta</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Bujnicki</surname>
<given-names>J. M.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>Structural and evolutionary bioinformatics of the SPOUT superfamily of methyltransferases</article-title>. <source>BMC Bioinforma.</source> <volume>8</volume>, <fpage>73</fpage>&#x2013;<lpage>31</lpage>. <pub-id pub-id-type="doi">10.1186/1471-2105-8-73</pub-id>
</citation>
</ref>
<ref id="B58">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Varadi</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Anyango</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Deshpande</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Nair</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Natassia</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Yordanova</surname>
<given-names>G.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>AlphaFold Protein Structure Database: massively expanding the structural coverage of protein-sequence space with high-accuracy models</article-title>. <source>Nucleic Acids Res.</source> <volume>50</volume>, <fpage>D439</fpage>&#x2013;<lpage>D444</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkab1061</pub-id>
</citation>
</ref>
<ref id="B59">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wagner</surname>
<given-names>J. R.</given-names>
</name>
<name>
<surname>Brunzelle</surname>
<given-names>J. S.</given-names>
</name>
<name>
<surname>Forest</surname>
<given-names>K. T.</given-names>
</name>
<name>
<surname>Vierstra</surname>
<given-names>R. D.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>A light-sensing knot revealed by the structure of the chromophore-binding domain of phytochrome</article-title>. <source>Nature</source> <volume>438</volume>, <fpage>325</fpage>&#x2013;<lpage>331</lpage>. <pub-id pub-id-type="doi">10.1038/nature04118</pub-id>
</citation>
</ref>
<ref id="B60">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wallin</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Zeldovich</surname>
<given-names>K. B.</given-names>
</name>
<name>
<surname>Shakhnovich</surname>
<given-names>E. I.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>The folding mechanics of a knotted protein</article-title>. <source>J. Mol. Biol.</source> <volume>368</volume>, <fpage>884</fpage>&#x2013;<lpage>893</lpage>. <pub-id pub-id-type="doi">10.1016/j.jmb.2007.02.035</pub-id>
</citation>
</ref>
<ref id="B61">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yan</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>S.-Y.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>HDOCK: a web server for protein&#x2013;protein and protein&#x2013;DNA/RNA docking based on a hybrid strategy</article-title>. <source>Nucleic Acids Res.</source> <volume>45</volume>, <fpage>W365</fpage>&#x2013;<lpage>W373</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkx407</pub-id>
</citation>
</ref>
<ref id="B62">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yeates</surname>
<given-names>T. O.</given-names>
</name>
<name>
<surname>Norcross</surname>
<given-names>T. S.</given-names>
</name>
<name>
<surname>King</surname>
<given-names>N. P.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>Knotted and topologically complex proteins as models for studying folding and stability</article-title>. <source>Curr. Opin. Chem. Biol.</source> <volume>11</volume>, <fpage>595</fpage>&#x2013;<lpage>603</lpage>. <pub-id pub-id-type="doi">10.1016/j.cbpa.2007.10.002</pub-id>
</citation>
</ref>
<ref id="B63">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhong</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Koay</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Ngo</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Nah</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Wong</surname>
<given-names>Y. H.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Targeting the bacterial epitranscriptome for antibiotic development: discovery of novel tRNA-(N1G37) methyltransferase (TrmD) inhibitors</article-title>. <source>ACS Infect. Dis.</source> <volume>5</volume>, <fpage>326</fpage>&#x2013;<lpage>335</lpage>. <pub-id pub-id-type="doi">10.1021/acsinfecdis.8b00275</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>