<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Cell. Infect. Microbiol.</journal-id>
<journal-title>Frontiers in Cellular and Infection Microbiology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Cell. Infect. Microbiol.</abbrev-journal-title>
<issn pub-type="epub">2235-2988</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fcimb.2021.794529</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Cellular and Infection Microbiology</subject>
<subj-group>
<subject>Hypothesis and Theory</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Using Genomics to Shape the Definition of the Agglutinin-Like Sequence (<italic>ALS</italic>) Family in the Saccharomycetales</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Oh</surname><given-names>Soon-Hwan</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/685500"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Schliep</surname><given-names>Klaus</given-names>
</name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Isenhower</surname><given-names>Allyson</given-names>
</name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/1167154"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Rodriguez-Bobadilla</surname><given-names>Rubi</given-names>
</name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Vuong</surname><given-names>Vien M.</given-names>
</name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/1551550/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Fields</surname><given-names>Christopher J.</given-names>
</name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/39251"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Hernandez</surname><given-names>Alvaro G.</given-names>
</name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/718682"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Hoyer</surname><given-names>Lois L.</given-names>
</name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn001"><sup>*</sup></xref>
<uri xlink:href="https://loop.frontiersin.org/people/22685"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Department of Pathobiology, College of Veterinary Medicine, University of Illinois at Urbana-Champaign</institution>, <addr-line>Urbana, IL</addr-line>, <country>United States</country></aff>
<aff id="aff2"><sup>2</sup><institution>Institute of Environmental Biotechnology, Graz University of Technology</institution>, <addr-line>Graz</addr-line>, <country>Austria</country></aff>
<aff id="aff3"><sup>3</sup><institution>Department of Biology, Millikin University</institution>, <addr-line>Decatur, IL</addr-line>, <country>United States</country></aff>
<aff id="aff4"><sup>4</sup><institution>Department of Computer Science, University of Illinois at Urbana-Champaign</institution>, <addr-line>Urbana, IL</addr-line>, <country>United States</country></aff>
<aff id="aff5"><sup>5</sup><institution>Roy J. Carver Biotechnology Center, University of Illinois at Urbana-Champaign</institution>, <addr-line>Urbana, IL</addr-line>, <country>United States</country></aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Priya Uppuluri, University of California, Los Angeles, United States</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Govind Vediyappan, Kansas State University, United States; Ci Fu, University of Toronto, Canada</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Lois L. Hoyer, <email xlink:href="mailto:lhoyer@illinois.edu">lhoyer@illinois.edu</email></p>
</fn>
<fn fn-type="other" id="fn002">
<p>This article was submitted to Fungal Pathogenesis, a section of the journal Frontiers in Cellular and Infection Microbiology</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>14</day>
<month>12</month>
<year>2021</year>
</pub-date>
<pub-date pub-type="collection">
<year>2021</year>
</pub-date>
<volume>11</volume>
<elocation-id>794529</elocation-id>
<history>
<date date-type="received">
<day>13</day>
<month>10</month>
<year>2021</year>
</date>
<date date-type="accepted">
<day>09</day>
<month>11</month>
<year>2021</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2021 Oh, Schliep, Isenhower, Rodriguez-Bobadilla, Vuong, Fields, Hernandez and Hoyer</copyright-statement>
<copyright-year>2021</copyright-year>
<copyright-holder>Oh, Schliep, Isenhower, Rodriguez-Bobadilla, Vuong, Fields, Hernandez and Hoyer</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>The <italic>Candida albicans</italic> agglutinin-like sequence (<italic>ALS</italic>) family is studied because of its contribution to cell adhesion, fungal colonization, and polymicrobial biofilm formation. The goal of this work was to derive an accurate census and sequence for <italic>ALS</italic> genes in pathogenic yeasts and other closely related species, while probing the boundaries of the <italic>ALS</italic> family within the Order Saccharomycetales. Bioinformatic methods were combined with laboratory experimentation to characterize 47 novel <italic>ALS</italic> loci from 8 fungal species. AlphaFold predictions suggested the presence of a conserved N-terminal adhesive domain (NT-Als) structure in all Als proteins reported to date, as well as in <italic>S. cerevisiae</italic> alpha-agglutinin (Sag1). <italic>Lodderomyces elongisporus</italic>, <italic>Meyerozyma guilliermondii</italic>, and <italic>Scheffersomyces stipitis</italic> were notable because each species had genes with <italic>C. albicans ALS</italic> features, as well as at least one that encoded a Sag1-like protein. Detection of recombination events between the <italic>ALS</italic> family and gene families encoding other cell-surface proteins such as Iff/Hyr and Flo suggest widespread domain swapping with the potential to create cell-surface diversity among yeast species. Results from the analysis also revealed subtelomeric <italic>ALS</italic> genes, <italic>ALS</italic> pseudogenes, and the potential for yeast species to secrete their own soluble adhesion inhibitors. Information presented here supports the inclusion of <italic>SAG1</italic> in the <italic>ALS</italic> family and yields many experimental hypotheses to pursue to further reveal the nature of the <italic>ALS</italic> family.</p>
</abstract>
<kwd-group>
<kwd>ALS genes</kwd>
<kwd>adhesion</kwd>
<kwd>comparative genomics</kwd>
<kwd>protein structure</kwd>
<kwd>fungi</kwd>
<kwd>repeated sequences</kwd>
</kwd-group>
<contract-sponsor id="cn001">National Institute of Dental and Craniofacial Research<named-content content-type="fundref-id">10.13039/100000072</named-content>
</contract-sponsor>
<counts>
<fig-count count="6"/>
<table-count count="4"/>
<equation-count count="0"/>
<ref-count count="94"/>
<page-count count="20"/>
<word-count count="11963"/>
</counts>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<title>Introduction</title>
<p>Most knowledge about agglutinin-like sequence (Als) protein structure and function comes from the study of <italic>Candida albicans</italic> (reviewed in <xref ref-type="bibr" rid="B32">Hoyer and Cota, 2016</xref>). <italic>C. albicans</italic> Als proteins are adhesins that promote interactions between fungi and host cells, establishing colonization that provides the opportunity to cause disease. Als proteins also function in <italic>C. albicans</italic> adhesion to abiotic surfaces such as indwelling medical devices, and between fungi and other microbes such as bacteria, seeding polymicrobial biofilm development (<xref ref-type="bibr" rid="B66">Peters et al., 2012</xref>).</p>
<p>Using Als protein features known at the time, <xref ref-type="bibr" rid="B32">Hoyer and Cota (2016)</xref> suggested the NT/T/TR/CT model for proteins in the Als family with each protein possessing an NT-Als adhesive domain (NT; <xref ref-type="bibr" rid="B46">Lin et al., 2014</xref>), followed by a Thr-rich region (T), tandemly repeated sequences (TR), and a C-terminal (CT) domain rich in Ser and Thr. Other key features include a secretory signal peptide and GPI anchor addition sequence that direct the mature protein to &#x3b2;-1,6-glucan crosslinkage in the fungal cell wall (<xref ref-type="bibr" rid="B53">Lu et al., 1994</xref>). Display of the NT-Als adhesive domain on the cell surface is key for its ability to interact with other cells and materials (<xref ref-type="bibr" rid="B46">Lin et al., 2014</xref>).</p>
<p>The crystallographic structure of the NT-Als adhesive domain revealed protein folding driven by formation of 4 disulfide bonds (8 Cys); an invariant Lys is located at the end of the NT-Als binding pocket (<xref ref-type="bibr" rid="B70">Salgado et al., 2011</xref>). The positively charged Lys establishes a salt bridge with the C-terminal carboxylic acid of an incoming peptide ligand. Als binding affinity is at the micromolar level; avidity of Als protein interactions is increased by a peptide sequence with high &#x3b2;-aggregation potential (called the amyloid-forming region; AFR; <xref ref-type="bibr" rid="B49">Lipke et al., 2018</xref>).</p>
<p>The first <italic>ALS</italic> gene was named for the similarity of its predicted protein to <italic>Saccharomyces cerevisiae</italic> alpha-agglutinin (Sag1; <xref ref-type="bibr" rid="B34">Hoyer et al., 1995</xref>). At that time, considerably less DNA sequence information was available in public databases. Sag1 is an adhesin that promotes cell-cell contact between haploid yeasts during the mating process (<xref ref-type="bibr" rid="B84">Wojciechowicz et al., 1993</xref>). Sag1 binds the carboxyl-terminal peptide of <bold>a</bold>-agglutinin with nanomolar affinity (<xref ref-type="bibr" rid="B7">Cappellaro et al., 1994</xref>; <xref ref-type="bibr" rid="B89">Zhao et al., 2001</xref>). In contrast to Als proteins, the sequence of the N-terminal region of Sag1 has 6 Cys and an Arg residue at the position of the invariant Lys. The structure of Sag1 was not solved experimentally although molecular modeling and biochemical analyses contributed considerable insight into protein function and potential structure (<xref ref-type="bibr" rid="B9">Chen et al., 1995</xref>; <xref ref-type="bibr" rid="B48">Lipke et al., 1995</xref>; <xref ref-type="bibr" rid="B29">Grigorescu et al., 2000</xref>). Despite inherent differences between Als proteins and Sag1, various authors recognized the common features between these proteins and proposed that Sag1 is part of the Als family (<xref ref-type="bibr" rid="B32">Hoyer and Cota, 2016</xref>; <xref ref-type="bibr" rid="B47">Lipke, 2018</xref>).</p>
<p>The rich foundation of experimental evidence from <italic>C. albicans</italic> was used to define <italic>ALS</italic> genes and their encoded proteins in other fungal species including <italic>Candida dubliniensis</italic> (<xref ref-type="bibr" rid="B35">Jackson et al., 2009</xref>), <italic>Candida parapsilosis</italic> (<xref ref-type="bibr" rid="B63">Oh et al., 2019</xref>), <italic>Candida orthopsilosis</italic> (<xref ref-type="bibr" rid="B52">Lombardi et al., 2019</xref>), <italic>Candida metapsilosis</italic> (<xref ref-type="bibr" rid="B63">Oh et al., 2019</xref>) and <italic>Candida tropicalis</italic> (<xref ref-type="bibr" rid="B62">Oh et al., 2021</xref>). The burgeoning number of publicly available draft genome sequences provides the opportunity to locate other <italic>ALS</italic> sequences using a simple BLAST search. However, lack of proper gene assembly is a frequent stumbling block due to the tendency for each species to have multiple <italic>ALS</italic> loci and for <italic>ALS</italic> genes to encode long stretches of highly conserved, tandemly repeated sequences. Computer assembly of short-read sequences often breaks down in <italic>ALS</italic> coding regions because the length of repeated sequences is similar to the length of sequence reads (<xref ref-type="bibr" rid="B52">Lombardi et al., 2019</xref>). Emergence of long-read DNA sequencing technology provided datasets with more-accurate <italic>ALS</italic> assemblies, however, PCR amplification and Sanger sequencing are still frequently required to complete <italic>ALS</italic> loci (<xref ref-type="bibr" rid="B63">Oh et al., 2019</xref>; <xref ref-type="bibr" rid="B62">Oh et al., 2021</xref>).</p>
<p>The initial focus of this work was to derive an accurate census and sequence for the <italic>ALS</italic> genes in the human pathogenic Saccharomycetales species. Closely related species, including some with biotechnological importance, were also studied because their genome sequences are incorporated into available analysis tools (<xref ref-type="bibr" rid="B55">Maguire et al., 2013</xref>). Information presented here expands the list of known <italic>ALS</italic> loci, adding 47 carefully validated genes from 8 fungal species. Four long-read-based genome assemblies were generated. Predicted proteins were evaluated in the context of the model <italic>C. albicans</italic> Als and <italic>S. cerevisiae</italic> Sag1 characteristics. The availability of new, accurate structural prediction tools (<xref ref-type="bibr" rid="B39">Jumper et al., 2021</xref>) provided the opportunity to assess similarities within this group of proteins. Recent release of many new genome sequences for budding yeasts in the subphylum Saccharomycotina (<xref ref-type="bibr" rid="B74">Shen et al., 2018</xref>) allowed new insight into whether <italic>C. albicans</italic> Als proteins and <italic>S. cerevisiae</italic> Sag1 arose from a common ancestor. The resulting information redefines the <italic>ALS</italic> family, its diversity, and taxonomic boundaries. Information presented here also provides the basis for new hypotheses regarding Als protein function.</p>
</sec>
<sec id="s2" sec-type="materials|methods">
<title>Materials and Methods</title>
<sec id="s2_1">
<title>Fungal Strain and Public Genome Sequence Resources</title>
<p>To ensure use of authenticated materials, <italic>Lodderomyces elongisporus</italic> strain NRRL YB-4239 and <italic>Spathaspora passalidarum</italic> strain NRRL Y-27907 were obtained from the Agricultural Research Service Culture Collection (Peoria, IL; <uri xlink:href="https://nrrl.ncaur.usda.gov">https://nrrl.ncaur.usda.gov</uri>). <italic>Meyerozyma guilliermondii</italic> strain ATCC 6260 and <italic>Scheffersomyces stipitis</italic> strain CBS 6054 (ATCC 58785) were purchased from the American Type Culture Collection (<uri xlink:href="https://www.atcc.org">https://www.atcc.org</uri>). <xref ref-type="table" rid="T1"><bold>Table 1</bold></xref> lists genome sequences used for this study.</p>
<table-wrap id="T1" position="float">
<label>Table 1</label>
<caption>
<p>Principal genome sequences used for <italic>ALS</italic> gene detection.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="left">Species</th>
<th valign="top" align="center">Strain</th>
<th valign="top" align="center">Assembly Name</th>
<th valign="top" align="center">GenBank Assembly Accession</th>
<th valign="top" align="center">Reference</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left"><italic>Candida albicans</italic></td>
<td valign="top" align="left">SC5314</td>
<td valign="top" align="left">ASM18296v3</td>
<td valign="top" align="left">GCA_000182965.3</td>
<td valign="top" align="left"> (<xref ref-type="bibr" rid="B38">Jones et al., 2004</xref>)</td>
</tr>
<tr>
<td valign="top" align="left"><italic>Candida dubliniensis</italic></td>
<td valign="top" align="left">CD36</td>
<td valign="top" align="left">ASM2694v1</td>
<td valign="top" align="left">GCA_000026945.1</td>
<td valign="top" align="left"> (<xref ref-type="bibr" rid="B35">Jackson et al., 2009</xref>)</td>
</tr>
<tr>
<td valign="top" align="left"><italic>Candida parapsilosis</italic></td>
<td valign="top" align="left">CDC317</td>
<td valign="top" align="left">ASM18276v2</td>
<td valign="top" align="left">GCF_000182765.2</td>
<td valign="top" align="left"> (<xref ref-type="bibr" rid="B6">Butler et al., 2009</xref>)</td>
</tr>
<tr>
<td valign="top" align="left"><italic>Candida orthopsilosis</italic></td>
<td valign="top" align="left">Co 90-125</td>
<td valign="top" align="left">ASM31587v1</td>
<td valign="top" align="left">GCA_000315875.1</td>
<td valign="top" align="left"> (<xref ref-type="bibr" rid="B67">Riccombeni et al., 2012</xref>)</td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left">ASM433491v1</td>
<td valign="top" align="left">GCA_004334915.1</td>
<td valign="top" align="left"> (<xref ref-type="bibr" rid="B52">Lombardi et al., 2019</xref>)</td>
</tr>
<tr>
<td valign="top" align="left"><italic>Candida metapsilosis</italic></td>
<td valign="top" align="left">ATCC 96143</td>
<td valign="top" align="left">UIUC_Cmeta_2.0</td>
<td valign="top" align="left">GCA_008904905.1</td>
<td valign="top" align="left"> (<xref ref-type="bibr" rid="B63">Oh et al., 2019</xref>)</td>
</tr>
<tr>
<td valign="top" align="left"><italic>Candida tropicalis</italic></td>
<td valign="top" align="left">MYA-3404</td>
<td valign="top" align="left">ASM633v3</td>
<td valign="top" align="left">GCA_000006335.3</td>
<td valign="top" align="left"> (<xref ref-type="bibr" rid="B6">Butler et al., 2009</xref>)</td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left">ASM694213v1</td>
<td valign="top" align="left">GCA_006942135.1</td>
<td valign="top" align="left"> (<xref ref-type="bibr" rid="B62">Oh et al., 2021</xref>)</td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left">ASM1731540v1</td>
<td valign="top" align="left">GCA_017315405.1</td>
<td valign="top" align="left"> (<xref ref-type="bibr" rid="B30">Guin et al., 2020</xref>)</td>
</tr>
<tr>
<td valign="top" align="left"><italic>Meyerozyma guilliermondii</italic></td>
<td valign="top" align="left">ATCC 6260</td>
<td valign="top" align="left">ASM14942v1</td>
<td valign="top" align="left">GCA_000149425.1</td>
<td valign="top" align="left"> (<xref ref-type="bibr" rid="B6">Butler et al., 2009</xref>)</td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left">ASM694215v1</td>
<td valign="top" align="left">GCA_006942155.1</td>
<td valign="top" align="left">This work</td>
</tr>
<tr>
<td valign="top" align="left"><italic>Clavispora lusitaniae</italic></td>
<td valign="top" align="left">ATCC 42720</td>
<td valign="top" align="left">ASM383v1</td>
<td valign="top" align="left">GCA_000003835.1</td>
<td valign="top" align="left"> (<xref ref-type="bibr" rid="B6">Butler et al., 2009</xref>)</td>
</tr>
<tr>
<td valign="top" align="left"><italic>Scheffersomyces sitpitis</italic></td>
<td valign="top" align="left">CBS 6054</td>
<td valign="top" align="left">ASM20916v1</td>
<td valign="top" align="left">GCA_000209165.1</td>
<td valign="top" align="left"> (<xref ref-type="bibr" rid="B36">Jeffries et al., 2007</xref>)</td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left">ASM694211v1</td>
<td valign="top" align="left">GCA_006942115.1</td>
<td valign="top" align="left">This work</td>
</tr>
<tr>
<td valign="top" align="left"><italic>Debaryomyces hansenii</italic></td>
<td valign="top" align="left">CBS 767</td>
<td valign="top" align="left">ASM644v2</td>
<td valign="top" align="left">GCA_000006445.2</td>
<td valign="top" align="left"> (<xref ref-type="bibr" rid="B14">Dujon et al., 2004</xref>)</td>
</tr>
<tr>
<td valign="top" align="left"><italic>Lodderomyces elongisporus</italic></td>
<td valign="top" align="left">NRRL YB-4239</td>
<td valign="top" align="left">ASM14968v1</td>
<td valign="top" align="left">GCA_000149685.1</td>
<td valign="top" align="left"> (<xref ref-type="bibr" rid="B6">Butler et al., 2009</xref>)</td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left">ASM1362098v1</td>
<td valign="top" align="left">GCA_013620985.1</td>
<td valign="top" align="left">This work</td>
</tr>
<tr>
<td valign="top" align="left"><italic>Yamadazyma tenuis</italic></td>
<td valign="top" align="left">ATCC 10573</td>
<td valign="top" align="left">Candida tenuis v1.0</td>
<td valign="top" align="left">GCA_000223465.1</td>
<td valign="top" align="left"> (<xref ref-type="bibr" rid="B83">Wohlbach et al., 2011</xref>)</td>
</tr>
<tr>
<td valign="top" align="left"><italic>Spathaspora passalidarum</italic></td>
<td valign="top" align="left">NRRL Y-27907</td>
<td valign="top" align="left">S passalidarum v2.0</td>
<td valign="top" align="left">GCA_000223485.1</td>
<td valign="top" align="left"> (<xref ref-type="bibr" rid="B83">Wohlbach et al., 2011</xref>)</td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left">ASM1362096v1</td>
<td valign="top" align="left">GCA_013620965.1</td>
<td valign="top" align="left">This work</td>
</tr>
<tr>
<td valign="top" align="left"><italic>Pichia kudriavzevii</italic></td>
<td valign="top" align="left">ATCC 6258</td>
<td valign="top" align="left">ASM305444v1</td>
<td valign="top" align="left">GCA_003054445.1</td>
<td valign="top" align="left"> (<xref ref-type="bibr" rid="B12">Douglass et al., 2018</xref>)</td>
</tr>
<tr>
<td valign="top" align="left"><italic>Candida glabrata</italic></td>
<td valign="top" align="left">CBS138</td>
<td valign="top" align="left">ASM254v2</td>
<td valign="top" align="left">GCA_000002545.2</td>
<td valign="top" align="left"> (<xref ref-type="bibr" rid="B14">Dujon et al., 2004</xref>)</td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left">BG2</td>
<td valign="top" align="left">ASM1421772v1</td>
<td valign="top" align="left">GCA_010111755.1</td>
<td valign="top" align="left"> (<xref ref-type="bibr" rid="B85">Xu et al., 2020</xref>)</td>
</tr>
<tr>
<td valign="top" align="left"><italic>Saccharomyces cerevisiae</italic></td>
<td valign="top" align="left">S288C</td>
<td valign="top" align="left">R64</td>
<td valign="top" align="left">GCA_000146045.2</td>
<td valign="top" align="left"> (<xref ref-type="bibr" rid="B24">Goffeau et al., 1996</xref>)</td>
</tr>
<tr>
<td valign="top" align="left"><italic>Candida auris</italic></td>
<td valign="top" align="left">B8441</td>
<td valign="top" align="left">Cand_auris_B8441_V2</td>
<td valign="top" align="left">GCA_002759435.2</td>
<td valign="top" align="left"> (<xref ref-type="bibr" rid="B50">Lockhart et al., 2017</xref>)</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s2_2">
<title>Genome Sequencing and Assembly</title>
<p>New genome assemblies were constructed for <italic>L. elongisporus</italic> NRRL YB-4239 (ASM1362098v1), <italic>M. guilliermondii</italic> ATCC 6260 (ASM6942125v1), <italic>S. stipitis</italic> CBS 6054 (ASM694211v1), and <italic>S. passalidarum</italic> NRRL Y-27907 (ASM362096v1) using a combination of Illumina MiSeq and Oxford Nanopore MinION data. Details of the method and genome assembly are in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplementary Files S1</bold></xref><bold>&#x2013;</bold><xref ref-type="supplementary-material" rid="SM4"><bold>S4</bold></xref>, respectively. Similar methods were described previously (<xref ref-type="bibr" rid="B63">Oh et al., 2019</xref>; <xref ref-type="bibr" rid="B62">Oh et al., 2021</xref>) and were reproduced here for the reader&#x2019;s convenience.</p>
<p>Fungal cells were stored at -80&#xb0;C and streaked to YPD agar plates (per liter: 10 g yeast extract, 20 g Bacto peptone, 20 g dextrose, 20 g Bacto agar). A single colony was inoculated into YPD liquid medium and the culture grown 16 h at 30&#xb0;C and 200 r/min shaking. Genomic DNA was isolated according to <xref ref-type="bibr" rid="B75">Sherman et al. (1986)</xref>. Briefly, cells were spheroplasted with zymolyase and lysed with sodium dodecyl sulfate. The lysate was&#xa0;extracted with phenol, DNA precipitated with isopropanol, and the final preparation treated with Proteinase K. DNA shearing was minimized by use of wide-bore pipet tips and gentle mixing. Agarose gel electrophoresis was used to verify the presence of high-molecular-weight DNA prior to subsequent library preparation.</p>
<p>Libraries were constructed and sequenced at the Roy J. Carver Biotechnology Center, University of Illinois at Urbana-Champaign. Individually barcoded shotgun libraries were made using the Hyper Library construction kit (Roche) and pooled in equimolar concentration. The pooled libraries were quantitated by qPCR and sequenced on one MiSeq flowcell for 251 cycles from each end of the fragment using a MiSeq 500-cycle sequencing kit (version 2). PhiX DNA was used as a spike-in control for MiSeq sequencing runs. FASTQ files were generated and demultiplexed with bcl2fastq Conversion Software (Illumina, version 2.17.1.14). MiSeq reads were quality trimmed using Trimmomatic v0.36 (<xref ref-type="bibr" rid="B5">Bolger et al., 2014</xref>) to remove adaptors from the 3&#x2019; end of the reads prior to assembly, retaining all reads greater than or equal to 50 nt in length.</p>
<p>Libraries for Oxford Nanopore long-read sequencing used 1 &#x3bc;g of genomic DNA that was sheared in a gTube (Covaris, Woburn, MA, United States) for 1 min at 6,000 r/min in a MiniSpin plus microcentrifuge (Eppendorf, Hauppauge, NY, United States). The sheared DNA was converted to a shotgun library with the LSK-108 kit (Oxford Nanopore) with the Expansion barcoding kit (EXP-NBD103). The libraries were pooled in equimolar concentration and the pool was sequenced on two SpotON MK I (R9.5) flowcells for 48 h using a MinION MK 1B sequencer. Basecalling was done with software MinKNOW version 1.7.7 and demultiplexing was performed with the Albacore software version 1.2.4. Sixty bp were trimmed from each end of the reads to remove barcodes using a custom script.</p>
<p>Detailed assembly steps are outlined in <xref ref-type="supplementary-material" rid="SM1"><bold>Supplemental Files S1</bold></xref><bold>&#x2013;</bold><xref ref-type="supplementary-material" rid="SM4"><bold>S4</bold></xref> for the four genomes. In brief, trimming was performed using a simple Perl script to remove 60 nt from the ends of the reads, retaining reads longer than or equal to 1000 nt for the final assembly. Canu v1.5 (<xref ref-type="bibr" rid="B42">Koren et al., 2017</xref>) was used for assembly with the following parameters: &#x201c;canu -p asm -d useGrid = false -nanopore-raw genomeSize=&lt;GENOME_SIZE&gt; &lt;TRIMMED_FASTQ&gt;&#x201d;, using the relevant quality-trimmed reads from Porechop and the following estimated genome sizes as input: <italic>S. stipitis</italic> = 15.4 Mb, <italic>L. elongisporus</italic> = 15.5 Mb, <italic>M. guilliermondii</italic> = 10.6 Mb, <italic>S. passalidarum</italic> = 13.2 Mb.</p>
<p>Trimmed Oxford Nanopore reads were then aligned against their associated assembly using bwa v0.7.5 (<xref ref-type="bibr" rid="B44">Li, 2018</xref>) by first indexing the assembly using &#x201c;bwa index &lt;ASSEMBLY&gt;&#x201d;, then aligning reads using the parameters &#x201c;bwa mem -x ont2d &lt;ASSEMBLY_INDEX&gt; &lt;TRIMMED_READS&gt;&#x201d;. The alignment was then used to polish the assembly using nanopolish v0.7.1 (<xref ref-type="bibr" rid="B73">Senol Cali et al., 2018</xref>). Quality-trimmed MiSeq data were used to further polish the assembly using Pilon v1.22 for error correction (<xref ref-type="bibr" rid="B82">Walker et al., 2014</xref>). Assembly names and GenBank accession numbers for the genome sequences for <italic>L. elongisporus</italic> NRRL YB-4239, <italic>M. guilliermondii</italic> ATCC 6260, <italic>S. passalidarum</italic> NRRL Y-27907, and <italic>S. stipitis</italic> CBS 6054 are located in <xref ref-type="table" rid="T1"><bold>Table 1</bold></xref>.</p>
</sec>
<sec id="s2_3">
<title>Identification of <italic>ALS</italic> Genes and Predicted Als Protein Features</title>
<p>Methods for identifying <italic>ALS</italic> genes and deducing predicted protein features were nearly identical to those reported in previous publications (<xref ref-type="bibr" rid="B63">Oh et al., 2019</xref>; <xref ref-type="bibr" rid="B62">Oh et al., 2021</xref>). Details were reproduced here for the reader&#x2019;s convenience. BLAST (<uri xlink:href="https://blast.ncbi.nlm.nih.gov/Blast.cgi">https://blast.ncbi.nlm.nih.gov/Blast.cgi</uri>) was used to identify potential <italic>ALS</italic> genes and Als proteins in the genome sequences (<xref ref-type="table" rid="T1"><bold>Table 1</bold></xref>). BLAST searches were also conducted using the <italic>Candida</italic> Genome Database (<uri xlink:href="http://www.candidagenome.org">www.candidagenome.org</uri>; <xref ref-type="bibr" rid="B76">Skrzypek et al., 2017</xref>). Query sequences included all <italic>C. albicans ALS</italic> genes as reported by <xref ref-type="bibr" rid="B63">Oh et al. (2019)</xref>. As new <italic>ALS</italic>/Als sequences were identified, they were also used as BLAST queries until search reports failed to reveal new sequences.</p>
<p><italic>ALS</italic> gene sequences were verified or corrected by Sanger sequencing of PCR-amplified products. Primers were designed using the Primer Quest Tool (<uri xlink:href="https://www.idtdna.com">https://www.idtdna.com</uri>) and primers purchased from Integrated DNA Technologies (Coralville, IA). PCR used Q5 High Fidelity DNA Polymerase (New England Biolabs) according to the manufacturer&#x2019;s instructions. Extension time was adjusted to promote amplification of the desired product size. PCR products were purified using the MultiScreen HTS 96-well Filtration System (Millipore), then Sanger sequenced at the Roy J. Carver Biotechnology Center (University of Illinois at Urbana-Champaign). A list of primer sequences is located in <xref ref-type="supplementary-material" rid="ST1"><bold>Supplementary Table S1</bold></xref>.</p>
<p>SignalP-5.0 Server (<uri xlink:href="http://www.cbs.dtu.dk/services/SignalP">http://www.cbs.dtu.dk/services/SignalP</uri>; <xref ref-type="bibr" rid="B61">Nielsen, 2017</xref>) was used to locate putative secretory signal peptides. The Big-PI Fungal Predictor (<uri xlink:href="https://mendel.imp.ac.at/gpi/fungi_server.html">https://mendel.imp.ac.at/gpi/fungi_server.html</uri>; <xref ref-type="bibr" rid="B16">Eisenhaber et al., 2004</xref>) identified potential GPI anchor addition sites. Dotmatcher (<uri xlink:href="http://emboss.bioinformatics.nl/cgi-bin/emboss/dotmatcher">http://emboss.bioinformatics.nl/cgi-bin/emboss/dotmatcher</uri>) was used to detect repeated sequences. The ExPASy Server was used to assess amino acid sequence composition (<uri xlink:href="https://web.expasy.org/protparam">https://web.expasy.org/protparam</uri>; <xref ref-type="bibr" rid="B22">Gasteiger et al., 2005</xref>). European Bioinofrmatics Institute (EMBL-EBI) tools were used for translating nucleotide sequences, sequence alignment, and other general processes (<uri xlink:href="https://www.ebi.ac.uk/services">https://www.ebi.ac.uk/services</uri>; <xref ref-type="bibr" rid="B11">Cook et al., 2017</xref>). &#x3b2;-aggregation potential in amino acid sequences was assessed using Tango (<uri xlink:href="http://tango.crg.es">http://tango.crg.es</uri>; <xref ref-type="bibr" rid="B18">Fernandez-Escamilla et al., 2004</xref>; <xref ref-type="bibr" rid="B68">Rousseau et al., 2006</xref>). All nucleotide sequences were translated with the alternative yeast nuclear code (translation table 12) except those from <italic>C. glabrata</italic> and <italic>S. cerevisiae</italic> which used the standard code (translation table 1). There was disagreement about the translation table for <italic>L. elongisporus</italic>: the NCBI database used translation table 1 even though the species was recognized as part of the CUG clade that translates CUG as Ser instead of Leu (translation table 12; <xref ref-type="bibr" rid="B71">Santos et al., 2011</xref>).</p>
</sec>
<sec id="s2_4">
<title>Phylogenetics Analysis</title>
<p>The kingdom Fungi phylogeny of <xref ref-type="bibr" rid="B45">Li et al. (2021)</xref>, based on 290 genes from 1644 species, was pruned using the R package ape (<xref ref-type="bibr" rid="B65">Paradis and Schliep, 2019</xref>). <italic>C. metapsilosis</italic> was not included in the phylogeny. Because of its close relationship to <italic>C. parapsilosis</italic> and <italic>C. orthopsilosis</italic> (<xref ref-type="bibr" rid="B78">Tavanti et al., 2005</xref>), <italic>C. metapsilosis</italic> was attached at the root of these sister species.</p>
<p>Sequences for phylogenetic analysis were trimmed to include only the NT-Als domain, which has adhesive function (<xref ref-type="bibr" rid="B46">Lin et al., 2014</xref>). Secretory signal peptide sequences were included in the analysis. Tango (<uri xlink:href="http://tango.crg.es">http://tango.crg.es</uri>; <xref ref-type="bibr" rid="B68">Rousseau et al., 2006</xref>; <xref ref-type="bibr" rid="B18">Fernandez-Escamilla et al., 2004</xref>) was used to define the amyloid-forming region (AFR) that marks the C-terminal end of NT-Als (<xref ref-type="bibr" rid="B46">Lin et al., 2014</xref>). Sequences that did not encode an AFR were trimmed to a length similar to others in the dataset. Amino acid sequences used for phylogenetic analysis were compiled into <xref ref-type="supplementary-material" rid="SM5"><bold>Supplementary File S5</bold></xref>. Sequences were aligned using MAFFT v7.453 (<xref ref-type="bibr" rid="B41">Katoh and Standley, 2013</xref>). A phylogeny was inferred using the best fit model WAG+G+I and subsequent bootstrap analysis was performed using RAxML-NG (<xref ref-type="bibr" rid="B43">Kozlov et al., 2019</xref>).</p>
</sec>
<sec id="s2_5">
<title>Structural Predictions</title>
<p>Protein structural predictions were derived using AlphaFold (<xref ref-type="bibr" rid="B39">Jumper et al., 2021</xref>), accessed using AlphaFold Colab (<uri xlink:href="https://colab.research.google.com/github/deepmind/alphafold/blob/main/notebooks/AlphaFold.ipynb">https://colab.research.google.com/github/deepmind/alphafold/blob/main/notebooks/AlphaFold.ipynb</uri>). ColabFold (<xref ref-type="bibr" rid="B57">Mirdita et al., 2021</xref>; <uri xlink:href="https://colab.research.google.com/github/sokrypton/ColabFold/blob/main/AlphaFold2.ipynb">https://colab.research.google.com/github/sokrypton/ColabFold/blob/main/AlphaFold2.ipynb</uri>) was used for more-rapid generation of structural prototypes. ColabFold utilized MMSeqs2 (UniRef+Environmental), as well as a custom MSA file constructed using Hhblits Toolkit server (<xref ref-type="bibr" rid="B90">Zimmerman et al., 2018</xref>; <xref ref-type="bibr" rid="B20">Gabler et al., 2020</xref>).</p>
<p>Clustal Omega (<xref ref-type="bibr" rid="B54">Madeira et al., 2019</xref>) was used to align amino acid sequences from <xref ref-type="supplementary-material" rid="SM5"><bold>Supplementary File S5</bold></xref> with those from 4LE8, the Protein Data Bank (<uri xlink:href="https://www.rcsb.org">https://www.rcsb.org</uri>) entry for the crystallographic structure of <italic>C. albicans</italic> NT-Als3 (chain A, 299 amino acids). This molecule did not include the secretory signal peptide at the N-terminal end nor the amyloid-forming region at the C-terminal end. Sequences in <xref ref-type="supplementary-material" rid="SM5"><bold>Supplementary File S5</bold></xref> were trimmed according to the Clustal Omega alignment and the trimmed sequences were used for AlphaFold analysis. Sequences for other fungal cell-surface proteins were included as controls in the structural analysis: <italic>C. albicans</italic> Hyr1 (NCBI Reference Sequence: XP_722183.2, amino acids 21 to 309) and <italic>S. cerevisiae</italic> Flo1 (NCBI Reference Sequence: NP_009424.1; amino acids 25 to 273). Structural visualization and alignments used the PyMOL Molecular Graphics System, Version 2.5.2 (Schr&#xf6;dinger, LLC).</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<title>Results</title>
<sec id="s3_1">
<title>Detection and Assembly of <italic>ALS</italic> Sequences in Eight Fungal Species</title>
<p>Examination of new and existing genome sequence data (<xref ref-type="table" rid="T1"><bold>Table 1</bold></xref>) provided the information needed to locate, assemble and/or validate the sequence for 47 <italic>ALS</italic> loci (5 from <italic>Lodderomyces elongisporus</italic> NRRL YB-4239; 3 from <italic>Candida auris</italic> B8441; 3 from <italic>Scheffersomyces stipitis</italic> CBS 6054; 4 from <italic>Meyerozyma guilliermondii</italic> ATCC 6260; 29 from <italic>Spathaspora passalidarum</italic> NRRL Y-27907; and 1 each from <italic>Clavispora lusitaniae</italic> ATCC 42720, <italic>Yamadazyma tenuis</italic> ATCC 10573, and <italic>Debaryomyces hansenii</italic> CBS 767). These sequences are presented here in the context of previously described <italic>ALS</italic> loci including 8 from <italic>Candida albicans</italic> SC5314 (<xref ref-type="bibr" rid="B33">Hoyer et al., 2008</xref>), 7 from <italic>Candida dubliniensis</italic> CD36 (<xref ref-type="bibr" rid="B35">Jackson et al., 2009</xref>), 13 from <italic>Candida tropicalis</italic> MYA-3404 (<xref ref-type="bibr" rid="B62">Oh et al., 2021</xref>), 5 from <italic>Candida parapsilosis</italic> CDC 317 (<xref ref-type="bibr" rid="B63">Oh et al., 2019</xref>), 3 from <italic>Candida orthopsilosis</italic> Co 90-125 (<xref ref-type="bibr" rid="B52">Lombardi et al., 2019</xref>), and 4 from <italic>Candida metapsilosis</italic> ATCC 96143 (<xref ref-type="bibr" rid="B63">Oh et al., 2019</xref>). <xref ref-type="supplementary-material" rid="ST2"><bold>Supplementary Table S2</bold></xref> details all gene names, GenBank accession numbers, and predicted protein characteristics. Gene names were taken from locus tags associated with the annotated reference genome for each species. For genes that were not annotated in the reference genome, &#x201c;0.5&#x201d; was added to the name, indicating that the ORF was located between two previously annotated genes. <xref ref-type="fig" rid="f1"><bold>Figure 1</bold></xref> displays the phylogenetic relationship between the species described here.</p>
<fig id="f1" position="float">
<label>Figure 1</label>
<caption>
<p>Phylogenetic tree showing relationships between fungal species used in this study. The tree was pruned from the genome-scale phylogeny of the kingdom Fungi developed by <xref ref-type="bibr" rid="B45">Li et al. (2021)</xref>. The phylogeny was based on 290 concatenated sequences in 1644 species. <italic>C. metapsilosis</italic> was not part of the original analysis and was added to the tree based on its close relationship with <italic>C. parapsilosis</italic> and <italic>C. orthopsilosis</italic> (<xref ref-type="bibr" rid="B78">Tavanti et al., 2005</xref>). All species listed were Phylum Ascomycota, Subphylum Saccharomycotina, Class Saccharomycetes, Order Saccharomycetales. Vertical bars on the right of the image indicate Family designations according to the NCBI Taxonomy Database (<uri xlink:href="https://www.ncbi.nlm.nih.gov/taxonomy">https://www.ncbi.nlm.nih.gov/taxonomy</uri>). Brown = Family <italic>Saccharomycetaceae</italic>, Green = Family <italic>Pichiaceae</italic>, Purple = Family <italic>Debaryomycetaceae</italic>, and Blue = Family <italic>Metschnikowiaceae</italic>.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fcimb-11-794529-g001.tif"/>
</fig>
<sec id="s3_1_1">
<title><italic>L. elongisporus</italic></title>
<p><italic>L. elongisporus</italic> is an infrequent human pathogen and, as accurately portrayed in <xref ref-type="fig" rid="f1"><bold>Figure 1</bold></xref>, closely related to <italic>C. parapsilosis</italic> (<xref ref-type="bibr" rid="B51">Lockhart et al., 2008</xref>). Two <italic>L. elongisporus</italic> genome sequences were available through the National Center for Biotechnology Information (NCBI; <uri xlink:href="https://www.ncbi.nlm.nih.gov">https://www.ncbi.nlm.nih.gov</uri>) database; both were for strain NRRL YB-4239 (<xref ref-type="table" rid="T1"><bold>Table 1</bold></xref>). Assembly ASM14968v1 was comprised of 145 contigs arranged into 28 scaffolds (i.e. composed of contigs and gaps that are indicated by insertion of &#x201c;NNN&#x201d;) while ASM1362098v1 had 53 contigs. <italic>ALS</italic> gene names were derived from the original annotation of the reference genome (ASM14968v1). Although a <italic>L. elongisporus</italic> karyotype was not located in the literature, the number of contigs/scaffolds was far higher than an expected number of chromosomes, indicating that the genome assemblies required refinement.</p>
<p>BLAST analysis using <italic>ALS</italic> query sequences consistently revealed 6 <italic>L. elongisporus</italic> loci (<xref ref-type="supplementary-material" rid="SM6"><bold>Supplementary File S6</bold></xref>). <italic>LeALS734</italic> was located in the middle of a &gt; 3 Mb supercontig in each genome assembly. <italic>LeALS2536</italic>, <italic>LeALS2716</italic> and <italic>LeALS2721</italic> were located in the center of another supercontig in ASM14968v1 with the latter two genes located near each other and transcribed in the same direction (<xref ref-type="fig" rid="f2"><bold>Figure 2</bold></xref>). The remaining genes (<italic>LELG_04272</italic>, <italic>LeALS5708</italic>) were each on their own supercontig.</p>
<fig id="f2" position="float">
<label>Figure 2</label>
<caption>
<p>Schematic of the genome region that included <italic>LeALS2716</italic> and <italic>LeALS2721</italic> from <bold>(A)</bold> assembly ASM14968v1 and <bold>(B)</bold> assembly ASM1362098v1. <bold>(C)</bold> shows the region as represented in the <italic>Candida</italic> Genome Order Browser (CGOB; <uri xlink:href="https://cgob.ucd.ie/">https://cgob.ucd.ie</uri>; <xref ref-type="bibr" rid="B55">Maguire et al., 2013</xref>) based on ASM14968v1 data. <italic>L. elongisporus</italic> information is circled in red; ORF numbers are shown in each rectangle and the direction of transcription indicated by the arrow below. ORFs 02718, 02719, and 02720 featured the <italic>IFF/HYR</italic> repeated sequences that were also found in <italic>LeALS2716</italic> suggesting that ORF 02716 was longer than initially annotated. The large number of repeated sequences complicated genome sequence assembly in this region. The predicted size of <italic>LeALS2716</italic> in ASM1362098v1 was greater than the final PCR-amplified/Sanger-sequenced fragment that was deposited into GenBank (accession number MN893370; green arrow).</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fcimb-11-794529-g002.tif"/>
</fig>
<p>Proteins predicted from five loci (<italic>LeALS734</italic>, <italic>LeALS2536</italic>, <italic>LeALS2716</italic>, <italic>LeALS2721</italic>, and <italic>LeALS5708</italic>) had features expected for an Als protein including a secretory signal peptide, NT-Als domain, Ser/Thr-rich sequences, and GPI anchor addition site (<xref ref-type="supplementary-material" rid="ST2"><bold>Supplementary Table S2</bold></xref>). Although the protein translated from the sixth locus (<italic>LELG_04272</italic>) had tandemly repeated sequences like those in Als proteins, the ORF did not predict an NT-Als domain (<xref ref-type="supplementary-material" rid="SM6"><bold>Supplementary File S6</bold></xref>). BLAST of sequences N-terminal to the LELG_04272 tandem repeats best matched <italic>M. guilliermondii</italic> PGUG_02520, a 660-amino acid protein of unknown function. The hybrid <italic>LELG_04272</italic> was likely the result of recombination between an <italic>ALS</italic> open reading frame (ORF) and another gene. Such recombination was observed previously between <italic>ALS</italic> and <italic>IFF/HYR</italic> genes in <italic>C. metapsilosis CmALS2265</italic> which encoded an Als N-terminal domain on the stalk of an Iff/Hyr protein (<xref ref-type="bibr" rid="B63">Oh et al., 2019</xref>). Because LELG_04272 lacked an NT-Als adhesive domain, it was not given an Als family name.</p>
<p>Similar to <italic>C. metapsilosis</italic>, recombination between <italic>ALS</italic> and <italic>IFF/HYR</italic> genes was evident in <italic>L. elongisporus</italic> (<xref ref-type="supplementary-material" rid="SM6"><bold>Supplementary File S6</bold></xref>). <italic>LeALS734</italic> and <italic>LeALS2716</italic> each had the 5&#x2019; end of an <italic>ALS</italic> gene and the 3&#x2019; end of an <italic>IFF/HYR</italic> gene. Consensus tandem repeat sequences for each locus closely matched that for <italic>CmALS2265</italic> (<xref ref-type="bibr" rid="B63">Oh et al., 2019</xref>). The remaining <italic>LeALS</italic> genes did not include a central domain of tandemly repeated sequences.</p>
<p>The predicted amino acid sequence of the NT-Als domain was highly conserved between LeAls2536, LeAls2721, and LeAls5708 (70-80% identity; <xref ref-type="supplementary-material" rid="SM6"><bold>Supplementary File S6</bold></xref>). LeAls734 and LeAls2716 were approximately 40% identical to each other and to the other <italic>L. elogisporus</italic> Als proteins. Since the crystallographic structure of <italic>C. albicans</italic> NT-Als3 is known (<xref ref-type="bibr" rid="B46">Lin et al., 2014</xref>), the CaAls3 sequence was included for comparison to newly characterized proteins. The LeAls proteins were 33-45% identical to the CaAls3 NT-Als sequence.</p>
<p>The incomplete <italic>L. elongisporus</italic> genome assemblies provided multiple opportunities for repairing ORFs. LELG_04272 lacked a GPI anchor addition site in its original annotation in ASM14968v1 (<xref ref-type="supplementary-material" rid="SM6"><bold>Supplementary File S6</bold></xref>). Primer design, PCR amplification, and Sanger DNA sequencing indicated that the downstream <italic>LELG_04271</italic> was actually the 3&#x2019; end of the <italic>LELG_04272</italic> coding region. The full sequence was deposited into GenBank (accession number OK172378). The region encoding <italic>LeALS2716</italic> and <italic>LeALS2721</italic> was also assembled poorly in the available genome sequences (<xref ref-type="fig" rid="f2"><bold>Figure 2</bold></xref>). Insertion of many NNN (designating unknown sequence) in this region of assembly ASM14968v1 made it difficult to locate the gene boundaries. The size of the verified <italic>LeALS2716</italic> was larger than predicted in assembly ASM14968v1, but smaller than suggested in assembly ASM1362098v1. The difference was possibly attributable to variation in tandem repeat copy number between alleles in the diploid <italic>L. elongisporus</italic>. A similar scenario was encountered for completing the sequence of <italic>LeALS734</italic>: several previously designated ORFs were combined into the final <italic>LeALS734</italic>, yet the sequence deposited into GenBank was shorter than anticipated from the genome assemblies that guided PCR primer design (details not shown).</p>
</sec>
<sec id="s3_1_2">
<title><italic>M. guilliermondii</italic></title>
<p>In addition to its role as a human pathogen, <italic>M. guilliermondii</italic> has applications in bioprocessing (e.g. production of riboflavin and xylitol) and bioremediation (reviewed in <xref ref-type="bibr" rid="B64">Papon et al., 2013</xref>). Eight <italic>M. guilliermondii</italic> genome assemblies were reported in the NCBI database. Two sequences were available for strain ATCC 6260, which was the focus of this work. ASM14942v1 consisted of 71 contigs arranged on 9 scaffolds. ASM694215v1 had 9 contigs.</p>
<p>Two of the 4 <italic>ALS</italic> loci in strain ATCC 6260 (<italic>MgALS2302</italic>, <italic>MgALS3259</italic>) were on the same chromosome, approximately 1.7 Mb away from each other at opposite telomeres, transcribed in opposite directions (<xref ref-type="supplementary-material" rid="SM7"><bold>Supplementary File S7</bold></xref>). The 3&#x2019; end of the 9681-bp <italic>MgALS2302</italic> was located approximately 10 kb from one telomere while the 3&#x2019; end of the 6963-bp <italic>MgAls3259</italic> was about 7 kb from the opposite telomere. The other two <italic>MgALS</italic> loci (<italic>MgALS673</italic> and <italic>MgALS3330</italic>) were each on other large contigs, likely representing <italic>M. guilliermondii</italic> chromosomes.</p>
<p>The coding region for <italic>MgALS3259</italic> predicted two potential start sites, one 60 bp upstream from the other. The second predicted Met start site provided a clear secretory signal peptide and was included in GenBank accession MH753514. <italic>PGUG_03259</italic> (accession number XM_001485480) included the upstream start site instead. Another difference between sequences deduced here and those from the ASM14942v1 assembly included the length of <italic>MgALS2302</italic>. The gene was considerably longer in the current work compared to previous GenBank deposits (9681 bp vs. 3840 bp). The new gene name reflected its inclusion of multiple ORFs (<italic>PGUG_02299</italic>, <italic>PGUG_02300</italic>, <italic>PGUG_02301</italic>, and <italic>PGUG_02302</italic>) and start of the gene in <italic>PGUG_02302</italic>.</p>
<p>Three of the 4 <italic>MgALS</italic> loci had an extensive central region of tandemly repeated sequences that were very similar to consensus repeats from previously characterized <italic>Candida</italic> genes (<xref ref-type="supplementary-material" rid="SM7"><bold>Supplementary File S7</bold></xref>). The most-common repeat unit size was 35 amino acids with a range of 34-36 amino acids. The predicted MgAls2302 and MgAls3259 NT-Als protein sequences were the most similar to each other. They shared 57% identity while other NT-Als comparisons were only about 30% identical.</p>
</sec>
<sec id="s3_1_3">
<title><italic>C. auris</italic></title>
<p>Availability of genome sequences for over 100 isolates of <italic>C. auris</italic> in the NCBI database reflected its emergence as an important pathogen (<xref ref-type="bibr" rid="B13">Du et al., 2020</xref>). Strain B8441 (18 contigs arranged into 15 scaffolds; assembly Cand_auris_B8441_V2) was used for this work (<xref ref-type="table" rid="T1"><bold>Table 1</bold></xref>). The three <italic>ALS</italic> loci in strain B8441 were on different scaffolds with <italic>CauALS2582</italic> in a subtelomeric location (<xref ref-type="supplementary-material" rid="SM8"><bold>Supplementary File S8</bold></xref>). Only one predicted <italic>C. auris</italic> Als protein (CauAls4112) had a central domain of tandemly repeated (34-39 amino acids) sequences. <italic>C. auris</italic> NT-Als sequences were 38-50% identical to each other and 25-33% identical to <italic>C. albicans</italic> NT-Als3. BLAST searching of other <italic>C. auris</italic> genomes showed that many were missing the <italic>CauALS2582</italic> locus. These observations matched the report of <xref ref-type="bibr" rid="B59">Mu&#xf1;oz et al. (2021)</xref> that described loss of subtelomeric adhesins such as <italic>CauALS2582</italic> in clade II <italic>C. auris</italic> isolates.</p>
</sec>
<sec id="s3_1_4">
<title><italic>S. stipitis</italic></title>
<p><italic>S. stipitis</italic> is studied because of its ability to ferment xylose, and thus its potential to contribute to biofuel production from hemicellulose (<xref ref-type="bibr" rid="B36">Jeffries et al., 2007</xref>). Because <italic>S. stipitis</italic> is within the CUG clade of the Family <italic>Debaryomycetaceae</italic>, the genome of this beetle-associated commensal yeast is often included in comparisons that feature human-pathogenic species (<xref ref-type="bibr" rid="B83">Wohlbach et al., 2011</xref>; <xref ref-type="bibr" rid="B55">Maguire et al., 2013</xref>). The NCBI database included three <italic>S. stipitis</italic> genome sequences: two for strain CBS 6054 (ASM20916v1 = 9 contigs arranged on 8 scaffolds; ASM694211v1 = 30 contigs) and one for strain NRRL Y-7124. Efforts here focused on strain CBS 6054 (<xref ref-type="table" rid="T1"><bold>Table 1</bold></xref>).</p>
<p>Strain CBS 6054 had three <italic>ALS</italic> loci (<xref ref-type="supplementary-material" rid="ST2"><bold>Supplementary Table S2</bold></xref>). Two (<italic>SsALS2386</italic> and <italic>SsALS2786</italic>) were on chromosome 2, approximately 700 kb apart and transcribed in opposite directions (<xref ref-type="supplementary-material" rid="SM9"><bold>Supplementary File S9</bold></xref>). The third (<italic>SsALS4579</italic>) was on chromosome 4. NT domains of the predicted chromosome 2 proteins were 58% identical. However, each was only 27-29% identical to SsAls4579. Both SsAls2386 and SsAls2786 had a central domain of tandemly repeated sequences that resembled those from previously studied <italic>Candida</italic> species.</p>
<p>BLAST searches and text searches of the NCBI database revealed other repeat-containing loci that were annotated as <italic>ALS</italic> genes in assembly ASM20916v1. For example, <italic>PICST_4391</italic> (called &#x201c;<italic>ALS1</italic>&#x201d;) was a fragment of <italic>SsALS2786</italic> described above. <italic>PICST_4539</italic> (called &#x201c;<italic>ALS1.2</italic>&#x201d;) was a fragment of <italic>SsALS2386</italic> and <italic>PICST_31759</italic> (called &#x201c;<italic>ALS6</italic>&#x201d;) corresponded to <italic>SsALS4579</italic>. <italic>PICST_31095</italic>, despite being named &#x201c;<italic>ALS2</italic>&#x201d;, belonged to the <italic>IFF/HYR</italic> family. Another, called &#x201c;<italic>ALS4</italic>&#x201d; (<italic>PICST_30411</italic>), was comprised only of repeated sequences. It was flanked by sequences that contained many stop codons with a low likelihood of encoding a larger ORF. In assembly ASM20916v1, <italic>PICST_30411</italic> was adjacent to an <italic>IFF/HYR</italic> gene in a subteromeric region on chromosome 2.</p>
</sec>
<sec id="s3_1_5">
<title><italic>S. passalidarum</italic></title>
<p>The <italic>S. passalidarum</italic> genome was also sequenced to study xylose metabolism in fungal species (<xref ref-type="bibr" rid="B83">Wohlbach et al., 2011</xref>). Because initial BLAST searching revealed an unusually high number of <italic>ALS</italic> loci in <italic>S. passalidarum</italic>, additional analysis was pursued. Two genome assemblies for strain NRRL Y-27907 were located in the NCBI database (<xref ref-type="table" rid="T1"><bold>Table 1</bold></xref>). One was created by the DOE Joint Genome Institute (Spathaspora passalidarum v2.0; 26 contigs arranged onto 8 scaffolds) and the other was part of the current work (ASM1362096v1; 10 contigs).</p>
<p>BLAST searching revealed 29 physical loci with sequence similarity to <italic>ALS</italic> genes (<xref ref-type="supplementary-material" rid="ST2"><bold>Supplementary Table S2</bold></xref>). Seven of the 8 contigs from assembly Spathaspora passalidarum v2.0 had at least 1 <italic>ALS</italic> locus, and as many as 7 <italic>ALS</italic> loci (<xref ref-type="table" rid="T2"><bold>Table 2</bold></xref>). Four locations featured <italic>ALS</italic> genes adjacent to each other: <italic>SpALS64434</italic> and <italic>SpALS64435</italic> on scaffold 1, <italic>SpALS50348</italic> and <italic>SpALS50349</italic> on scaffold 3, <italic>SpALS153035</italic> and <italic>SpALS153035.5</italic> on scaffold 4, and <italic>SpALS68952</italic> and <italic>SpALS68952.5</italic> on scaffold 8. Two <italic>ALS</italic> genes were subtelomeric: <italic>SpALS131476</italic> on scaffold 1 and <italic>SpALS137089</italic> on scaffold 3.</p>
<table-wrap id="T2" position="float">
<label>Table 2</label>
<caption>
<p>Physical location of <italic>ALS</italic> loci in the <italic>S. passalidarum</italic> NRRL Y-27907 genome.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="left">Scaffold (Size, Mb)</th>
<th valign="top" align="center">Gene Name</th>
<th valign="top" align="center">Approx. Location (nt)*</th>
<th valign="top" align="center">Tsc<sup>&#x2020;</sup></th>
<th valign="top" align="center">Scaffold (Size, Mb)</th>
<th valign="top" align="center">Gene Name</th>
<th valign="top" align="center">Approx. Location (nt)</th>
<th valign="top" align="center">Tsc<sup>&#x2020;</sup></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">1 (2.64)</td>
<td valign="top" align="left"><italic>SpALS131476</italic></td>
<td valign="top" align="center">9400</td>
<td valign="top" align="center">R<sup>&#x2021;</sup></td>
<td valign="top" align="center">4 (1.81)</td>
<td valign="top" align="left"><italic>SpALS61022.5</italic></td>
<td valign="top" align="center">69000</td>
<td valign="top" align="center">R</td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><bold><italic>SpALS64434</italic></bold></td>
<td valign="top" align="center"><bold>1407000</bold></td>
<td valign="top" align="center"><bold>F</bold></td>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>SpALS152224</italic></td>
<td valign="top" align="center">180000</td>
<td valign="top" align="center">R</td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><bold><italic>SpALS64435</italic></bold></td>
<td valign="top" align="center"><bold>1411000</bold></td>
<td valign="top" align="center"><bold>F</bold></td>
<td valign="top" align="left"/>
<td valign="top" align="left"><bold><italic>SpALS153035</italic></bold></td>
<td valign="top" align="center"><bold>876400</bold></td>
<td valign="top" align="center"><bold>F</bold></td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>SpALS146555</italic></td>
<td valign="top" align="center">1607000</td>
<td valign="top" align="center">F</td>
<td valign="top" align="left"/>
<td valign="top" align="left"><bold><italic>SpALS153035.5</italic></bold></td>
<td valign="top" align="center"><bold>879600</bold></td>
<td valign="top" align="center"><bold>F</bold></td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>SpALS138016</italic></td>
<td valign="top" align="center">1122200</td>
<td valign="top" align="center">F</td>
</tr>
<tr>
<td valign="top" align="left">2 (2.12)</td>
<td valign="top" align="left"><italic>SpALS134590</italic></td>
<td valign="top" align="center">189000</td>
<td valign="top" align="center">R</td>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>SpALS134590.5</italic></td>
<td valign="top" align="center">254000</td>
<td valign="top" align="center">F</td>
<td valign="top" align="center">5 (1.65)</td>
<td valign="top" align="left"><italic>SpALS155003</italic></td>
<td valign="top" align="center">1011000</td>
<td valign="top" align="center">R</td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>SpALS134426</italic></td>
<td valign="top" align="center">337300</td>
<td valign="top" align="center">F</td>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>SpALS140483</italic></td>
<td valign="top" align="center">1300300</td>
<td valign="top" align="center">R</td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>SpALS134874</italic></td>
<td valign="top" align="center">827000</td>
<td valign="top" align="center">R</td>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>SpALS140900</italic></td>
<td valign="top" align="center">1306000</td>
<td valign="top" align="center">R</td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>SpALS135549</italic></td>
<td valign="top" align="center">835000</td>
<td valign="top" align="center">R</td>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>SpALS141433</italic></td>
<td valign="top" align="center">1312800</td>
<td valign="top" align="center">R</td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>SpALS59511.5</italic></td>
<td valign="top" align="center">940000</td>
<td valign="top" align="center">R</td>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="center">6 (1.18)</td>
<td valign="top" align="left"><italic>SpALS156463</italic></td>
<td valign="top" align="center">710700</td>
<td valign="top" align="center">F</td>
</tr>
<tr>
<td valign="top" align="left">3 (2.07)</td>
<td valign="top" align="left"><italic>SpALS137089</italic></td>
<td valign="top" align="center">8400</td>
<td valign="top" align="center">R<sup>&#x2021;</sup></td>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>SpALS49824</italic></td>
<td valign="top" align="center">486000</td>
<td valign="top" align="center">R</td>
<td valign="top" align="center">8 (0.85)</td>
<td valign="top" align="left"><bold><italic>SpALS68952</italic></bold></td>
<td valign="top" align="center"><bold>600000</bold></td>
<td valign="top" align="center"><bold>R</bold></td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>SpALS136382</italic></td>
<td valign="top" align="center">858000</td>
<td valign="top" align="center">F</td>
<td valign="top" align="left"/>
<td valign="top" align="left"><bold><italic>SpALS68952.5</italic></bold></td>
<td valign="top" align="center"><bold>604000</bold></td>
<td valign="top" align="center"><bold>R</bold></td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>SpALS55077</italic></td>
<td valign="top" align="center">1015000</td>
<td valign="top" align="center">F</td>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>SpALS66147</italic></td>
<td valign="top" align="center">1021200</td>
<td valign="top" align="center">R</td>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><bold><italic>SpALS50348</italic></bold></td>
<td valign="top" align="center"><bold>1700000</bold></td>
<td valign="top" align="center"><bold>F</bold></td>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><bold><italic>SpALS50349</italic></bold></td>
<td valign="top" align="center"><bold>1702000</bold></td>
<td valign="top" align="center"><bold>F</bold></td>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>*Approximate location of each ORF in the Spathaspora passalidarum v2.0 assembly (GCA_000223485.1). Pairs of contiguous ORFs are indicated in bold type.</p>
</fn>
<fn>
<p><sup>&#x2020;</sup>Direction of transcription is noted as F (forward) or R (reverse).</p>
</fn>
<fn>
<p><sup>&#x2021;</sup>Subtelomeric localization.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>Examination of the encoded protein sequences showed that many did not have repeated sequences in the center (<xref ref-type="supplementary-material" rid="SM10"><bold>Supplementary File S10</bold></xref>). When present, repeated sequences were unusually long (<xref ref-type="supplementary-material" rid="ST2"><bold>Supplementary Table S2</bold></xref>), highly variable in the length of the repeat unit, and did not necessarily have tandemly arrayed repeat copies. A consensus of the 80-amino-acid and 89-amino-acid versions of the <italic>S. passalidarum</italic> repeated sequence resembled the T (Thr-rich) domain of <italic>C. albicans</italic> Als proteins that is located between the end of NT-Als and the start of the tandem repeat region (reviewed in <xref ref-type="bibr" rid="B32">Hoyer and Cota, 2016</xref>). Some manuscripts depict this region separately from &#x201c;NT-Als&#x201d; for which the crystal structure is known (e.g. <xref ref-type="bibr" rid="B63">Oh et al., 2019</xref>). Other manuscripts, like this one, include the T domain in the &#x201c;NT-Als +&#x201d; region for each protein.</p>
<p><italic>S. passalidarum</italic> had several partial <italic>ALS</italic> genes (<xref ref-type="supplementary-material" rid="SM10"><bold>Supplementary File S10</bold></xref>). In previous analyses, partial <italic>ALS</italic> genes indicated poor genome assembly that could be corrected by PCR amplification and Sanger sequencing (<xref ref-type="bibr" rid="B63">Oh et al., 2021</xref>). Here, however, PCR amplification and Sanger sequencing validated the accuracy of the partial <italic>ALS</italic> genes including the contiguous loci <italic>SpALS50348</italic> and <italic>SpALS50349</italic> that each only encoded an NT-Als domain with a secretory signal peptide. A clear stop codon between <italic>SpALS68952.5</italic> and <italic>SpALS68952</italic> created pseudogenes from a perhaps previously long, functional gene. Some predicted proteins lacked features such as a secretory signal peptide that would direct the protein toward cell-surface localization. Signal-peptide-encoding sequences were noted upstream of <italic>SpALS66147</italic> and <italic>SpALS134590.5</italic> but were separated from the ORF by at least one clear stop codon. Other predicted proteins (SpAls49824, SpAls61022.5, SpAls140483, and SpAls140900; <xref ref-type="supplementary-material" rid="SM10"><bold>Supplementary File S10</bold></xref>) showed only a weak signal for GPI anchor addition, suggesting that the mature proteins may not be localized to the cell surface. Among the proteins predicted to have both secretory signal peptide and strong GPI anchor addition signal, many were short, raising the question of how far the adhesive NT-Als domain could be projected away from the <italic>S. passalidarum</italic> cell surface to contact binding partners.</p>
<p>Comparison between the NT-Als domains for the predicted <italic>S. passalidarum</italic> proteins showed considerable sequence divergence from <italic>C. albicans</italic> NT-Als3 and from each other (<xref ref-type="supplementary-material" rid="SM10"><bold>Supplementary File S10</bold></xref>). Many comparisons were in the range of 22-45% identity although greater sequence conservation was observed for some pairs (60-80% range). Contiguous loci (37-62% identity) were not necessarily more conserved than other comparisons. The most-conserved pair was SpAls55077 and SpAls134590 (89%) potentially indicating a gene duplication.</p>
</sec>
<sec id="s3_1_6">
<title><italic>Y. tenuis</italic></title>
<p>Interest in the <italic>Y. tenuis</italic> genome also arose from its xylose fermentation capabilities (<xref ref-type="bibr" rid="B83">Wohlbach et al., 2011</xref>). A single complete <italic>ALS</italic> locus was detected in the only <italic>Y. tenuis</italic> genome assembly available in the NCBI database (strain ATCC 10573; Candida tenuis v1.0; <xref ref-type="table" rid="T1"><bold>Table 1</bold></xref>). The predicted YtAls93631 protein was &gt; 3000 amino acids and included a central domain of tandemly repeated sequences (32-45 amino acids; <xref ref-type="supplementary-material" rid="SM11"><bold>Supplementary File S11</bold></xref>). The most common repeat unit was 35 amino acids. The <italic>Y. tenuis</italic> genome sequence was quite fragmented, consisting of 74 contigs arranged onto 25 scaffolds. A second potential <italic>ALS</italic> locus was detected at the end of a scaffold sequence (CANTEscaffold_00010; 12.1 kb total length) suggesting that other <italic>Y. tenuis ALS</italic> loci may be revealed as the genome assembly matures.</p>
</sec>
<sec id="s3_1_7">
<title><italic>C. lusitaniae</italic></title>
<p><italic>C. lusitaniae</italic> is a less-frequent cause of human candidiasis (reviewed in <xref ref-type="bibr" rid="B19">Fran&#xe7;ois et al., 2001</xref>). Of the species considered here, <italic>C. lusitaniae</italic> was the most closely related to <italic>C. auris</italic> (<xref ref-type="fig" rid="f1"><bold>Figure 1</bold></xref>). More than 30 C<italic>. lusitaniae</italic> genome assemblies were available in the NCBI database. Observations here focused on strain ATCC 42720 (ASM383v1) which was comprised of 88 contigs arranged onto 9 scaffolds. One long <italic>ALS</italic> gene (&gt; 8 kb) was detected in this sequence (<xref ref-type="supplementary-material" rid="ST2"><bold>Supplementary Table S2</bold></xref>). BLAST of other available genomes also suggested a single <italic>ALS</italic> locus, although incomplete genome assemblies with many contigs may obscure the presence of other loci. Two different types of repeated DNA sequences were found in the center of <italic>ClALS3274</italic> (<xref ref-type="supplementary-material" rid="SM11"><bold>Supplementary File S11</bold></xref>). BLAST searching of the non-redundant nucleotide database suggested that the repeats predicting a 33 amino acid sequence were unique. The other repeated sequences were primarily 67 amino acids in length, although some repeat units expanded to 102 amino acids. Sequences within these longer repeats were reminiscent of motifs found in the Als consensus repeat from <italic>C. parapilsosis/C.orthopsilosis/C. metapsilosis</italic>, as well as the 80-amino-acid consensus repeat from <italic>S. passalidarum</italic> Als proteins (<xref ref-type="supplementary-material" rid="SM10"><bold>Supplementary File S10</bold></xref>).</p>
</sec>
<sec id="s3_1_8">
<title><italic>D. hansenii</italic></title>
<p>Rather than being studied as a pathogen, <italic>D. hansenii</italic> is discussed commonly in the context of food production (summarized in <xref ref-type="bibr" rid="B27">Gori et al., 2011</xref>). <italic>D. hansenii</italic> growth requires surface adhesion (<xref ref-type="bibr" rid="B58">Mortensen et al., 2005</xref>), a property that might involve Als proteins. The NCBI database displayed 12 <italic>D. hansenii</italic> genome sequences, representing 11 different strains. This work focused on CBS 767 (ASM644v2), which was designated as the reference genome and had 15 contigs arranged on 8 scaffolds. A single <italic>ALS</italic> locus was detected, located on the chromosome G contig (<xref ref-type="supplementary-material" rid="ST2"><bold>Supplementary Table S2</bold></xref>). The predicted protein, DhAls2178, did not contain tandemly repeated sequences (<xref ref-type="supplementary-material" rid="SM11"><bold>Supplementary File S11</bold></xref>).</p>
</sec>
<sec id="s3_1_9">
<title><italic>C. glabrata</italic></title>
<p><italic>C. glabrata</italic> is well-recognized as a human pathogen, particularly for its ability to rapidly evolve resistance to antifungal drugs (<xref ref-type="bibr" rid="B79">Vale-Silva and Sanglard, 2015</xref>). Eighteen <italic>C. glabrata</italic> genomes were present in the NCBI database. BLAST of the strain CBS 138 sequence using <italic>ALS</italic> and Als queries revealed CAGL0G04125g, which was annotated to indicate similarity to <italic>S. cerevisiae</italic> Sag1 (<xref ref-type="supplementary-material" rid="SM11"><bold>Supplementary File S11</bold></xref>). Like Sag1, the <italic>C. glabrata</italic> predicted protein did not encode a central domain of tandemly repeated sequences.</p>
</sec>
</sec>
<sec id="s3_2">
<title>NT-Als Structural Predictions</title>
<p>The <italic>C. albicans</italic> NT-Als3 structure was solved crystallographically (<xref ref-type="bibr" rid="B46">Lin et al., 2014</xref>; Protein Data Bank accession number 4LE8), providing experimental information that can be used to produce structural predictions for other NT-Als proteins. A crystallographic structure has not been reported for <italic>S. cerevisiae</italic> Sag1. The recent development of the highly accurate protein structural prediction program AlphaFold (<xref ref-type="bibr" rid="B39">Jumper et al., 2021</xref>) and widespread access to its use (e.g. <xref ref-type="bibr" rid="B57">Mirdita et al., 2021</xref>) provided the opportunity to assess predicted structural relatedness between the diverse set of NT-Als sequences and their similarity to Sag1.</p>
<p><xref ref-type="fig" rid="f3"><bold>Figure 3</bold></xref> shows the crystallographic structure of <italic>C. albicans</italic> NT-Als3 from 4LE8 (<xref ref-type="fig" rid="f3"><bold>Figure 3A</bold></xref>) and the AlphaFold-predicted structure for the same amino acid sequence (<xref ref-type="fig" rid="f3"><bold>Figure 3B</bold></xref>). The root-mean-square-deviation (RMSD) value for alignment of the two structures was 0.53, indicating the ability of AlphaFold to reproduce the crystallographic structure of NT-Als3 from its amino acid sequence. AlphaFold was then used to predict the structures of other NT-Als proteins, particularly those with limited sequence identity to <italic>C. albicans</italic> NT-Als3 (<xref ref-type="fig" rid="f3"><bold>Figures 3C&#x2013;G</bold></xref>). Strikingly, a similar structure was predicted for each protein, including Sag1. Analysis of each NT-Als sequence in <xref ref-type="supplementary-material" rid="SM5"><bold>Supplementary File S5</bold></xref> produced the same general protein shape (data not shown) suggesting that all, including Sag1, were unified as a family. To demonstrate diversity in structural predictions, the amino acid sequences for the N-terminal domain of the cell-surface proteins <italic>C. albicans</italic> Hyr1 (amino acids 21 to 309) and <italic>S. cerevisiae</italic> Flo1 (amino acids 25 to 273) were entered into AlphaFold. The resulting structural predictions were different from the Als family and from each other (<xref ref-type="fig" rid="f3"><bold>Figures 3H, I</bold></xref><bold>)</bold>.</p>
<fig id="f3" position="float">
<label>Figure 3</label>
<caption>
<p>Experimental and AlphaFold-predicted protein structures. <bold>(A)</bold> Crystallographic structure of <italic>C. albicans</italic> NT-Als3 (Protein Data Bank accession 4LE8) visualized using PyMOL. <bold>(B)</bold> <italic>C. albicans</italic> NT-Als3 structure predicted by AlphaFold from the 4LE8 amino acid sequence. AlphaFold structural predictions for the corresponding region of <italic>C. albicans</italic> NT-Als1 (<bold>C</bold>; 83% identical to NT-Als3), ClAls3274 (<bold>D</bold>; 33% identical to NT-Als3), ScSag1 (<bold>E</bold>; 25% identity), CauAls4498 (<bold>F</bold>; 31% identity), and CAGL0G04125g (<bold>G</bold>; 21% identity). An AlphaFold structural prediction was also completed for the N-terminal functional domain of <italic>C. albicans</italic> Hyr1 <bold>(H)</bold> and <italic>S. cerevisiae</italic> Flo1 <bold>(I)</bold> to demonstrate structural diversity among cell-surface proteins that contain a central domain of repeated sequences. The AlphaFold prediction for <italic>C. albicans</italic> NT-Als3 <bold>(B)</bold> recapitulated the known experimental structure (<bold>A</bold>; RMSD = 0.53 as calculated using PyMOL align). Predictions for molecules <bold>(B&#x2013;G)</bold> produced the same general structure suggesting that all should be included in the Als protein family. <xref ref-type="supplementary-material" rid="SM12"><bold>Supplementary File S12</bold></xref> shows the structures of <italic>C. albicans</italic> NT-Als3 <bold>(B)</bold> and ScSag1 <bold>(E)</bold> aligned with the disulfide bonds highlighted.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fcimb-11-794529-g003.tif"/>
</fig>
</sec>
<sec id="s3_3">
<title>Adhesive Activity Predictions From NT-Als Protein Features</title>
<p>In order to provide biologically meaningful adhesive activity on the fungal cell surface, Als proteins need a secretory signal peptide and GPI anchor addition site to achieve an effective localization (<xref ref-type="bibr" rid="B53">Lu et al., 1994</xref>). The crystallographic structure of <italic>C. albicans</italic> NT-Als3 (<xref ref-type="bibr" rid="B46">Lin et al., 2014</xref>) demonstrated the involvement of 8 Cys residues in folding of the mature protein and the function of an invariant Lys at the end of the binding cavity that sinks the negative charge of incoming peptide ligands. Other work demonstrated the importance of the amyloid-forming region (AFR) for increasing the avidity of aggregative interactions (<xref ref-type="bibr" rid="B31">Ho et al., 2019</xref>). <xref ref-type="supplementary-material" rid="ST2"><bold>Supplementary Table S2</bold></xref> evaluated each of these features for the previously characterized and newly introduced Als proteins. The data were summarized in <xref ref-type="fig" rid="f4"><bold>Figure 4</bold></xref> from which various hypotheses emerged.</p>
<fig id="f4" position="float">
<label>Figure 4</label>
<caption>
<p>Visualization of NT-Als sequence features from <xref ref-type="supplementary-material" rid="ST2"><bold>Supplementary Table S2</bold></xref>. Each spot represents an Als protein; color coding matches <xref ref-type="supplementary-material" rid="ST2"><bold>Supplementary Table S2</bold></xref>. <italic>C. albicans</italic> NT-Als3 has 8 Cys that create four disulfide bonds (<xref ref-type="bibr" rid="B46">Lin et al., 2014</xref>) while <italic>S. cerevisiae</italic> Sag1 has only 6 and is missing the C57-C133 disulfide bond that is present in NT-Als3 (<xref ref-type="bibr" rid="B70">Salgado et al., 2011</xref>). Most NT-Als proteins had 8 Cys like NT-Als3 (center column), some had 6 Cys like ScSag1 (left column), and others had varying numbers of Cys (range of 4 to 14; right column). Presence of the amyloid-forming region (AFR) in <italic>C. albicans</italic> Als proteins promotes protein aggregation (<xref ref-type="bibr" rid="B31">Ho et al., 2019</xref>). While many Als proteins had the expected AFR (strength and location; top row), others had a predicted weak AFR (second row) or none (bottom row). Some <italic>S. passalidarum</italic> Als proteins had a strong AFR 20-30 amino acids C-terminal to the expected location known in <italic>C. albicans</italic> (third row). It was unknown whether this alternative location contributed to aggregative potential. An invariant Lys in <italic>C. albicans</italic> NT-Als establishes a salt bridge with the C-terminal carboxylic acid of an incoming peptide ligand (<xref ref-type="bibr" rid="B70">Salgado et al., 2011</xref>). Arg (R) in this location may serve a similar function. Some predicted proteins did not have a positively charged amino acid in this position (X). A red asterisk indicates proteins featured in the structural predictions (<xref ref-type="fig" rid="f3"><bold>Figure 3</bold></xref>).</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fcimb-11-794529-g004.tif"/>
</fig>
<p>The cluster of dots in the top center of <xref ref-type="fig" rid="f4"><bold>Figure 4</bold></xref> contained proteins with 8 Cys and an invariant Lys. Each protein represented in the top center cluster of dots also had an AFR with high predicted &#x3b2;-aggregation potential and a location immediately C-terminal to the NT-Als domain as in <italic>C. albicans</italic> Als proteins (<xref ref-type="bibr" rid="B70">Salgado et al., 2011</xref>; <xref ref-type="bibr" rid="B49">Lipke et al., 2018</xref>). The top center cluster of dots included 7 of the 8 C<italic>. albicans</italic> Als proteins, 6 of 7 from <italic>C. dubliniensis</italic>, and 9 of 13 from <italic>C. tropicalis</italic> suggesting robust potential for functional adhesive interactions by these species. Also present in the top center cluster of dots were 2 of the <italic>S. stipitis</italic> Als proteins, 2 from <italic>S. passalidarum</italic>, and 1 each from <italic>C. parapsilosis</italic>, <italic>C. metapsilosis</italic>, <italic>L. elongisporus</italic>, and <italic>Y. tenuis</italic>.</p>
<p>Viewing potential Als function according to these criteria provided predictions about the adhesive activity in other species. For example, <italic>C. parapsilosis</italic>, <italic>C. orthopsilosis</italic>, and <italic>C. metapsilosis</italic> Als proteins almost universally had a weaker or absent AFR leading to the hypothesis that these species are functionally less adherent than <italic>C. albicans</italic>, <italic>C. dubliniensis</italic>, and <italic>C. tropicalis</italic>. Data in <xref ref-type="fig" rid="f4"><bold>Figure 4</bold></xref> suggested a similar hypothesis for <italic>S. passalidarum</italic>: despite its overabundance of <italic>ALS</italic>-like loci, <italic>S. passalidarum</italic> encoded only two proteins (SpAls138016 and SpAls156463; <xref ref-type="supplementary-material" rid="SM10"><bold>Supplementary File S10</bold></xref>) that possessed the functional features present in NT-Als3 and therefore may not be a very adherent species. However, nine SpAls proteins had AFR sequences 20-30 amino acids C-terminal to the location where they are found in <italic>C. albicans</italic> Als3 (<xref ref-type="supplementary-material" rid="ST2"><bold>Supplementary Table S2</bold></xref>). Experimentation is required to evaluate whether sequences with high &#x3b2;-aggregation potential in this alternative location contribute to <italic>S. passalidarum</italic> aggregative interactions. Using the criteria in <xref ref-type="fig" rid="f4"><bold>Figure 4</bold></xref>, <italic>C. lusitaniae</italic> was an outlier. Its sole Als protein, ClAls3274, had only 4 Cys residues and no AFR. Despite these key differences, the predicted structure for the NT-ClAls3274 domain was similar to those from other species (<xref ref-type="fig" rid="f3"><bold>Figure 3D</bold></xref>). The contribution of ClAls3274 remains to be tested, as does the overall adhesion profile for the species.</p>
<p>Proteins with features that more closely resemble Sag1 than <italic>C. albicans</italic> Als3 segregated to the left column of the diagram. Substitution of Arg (R printed in the dot) in place of the invariant Lys was a common theme. Three of the four <italic>M. guilliermondii</italic> Als proteins were in the left column. Perhaps these proteins have more-specific, higher-affinity adhesive interactions that more-closely resemble those of Sag1, rather than NT-Als3. The same prediction could be made for two of the <italic>C. auris</italic> proteins, as well as the sole protein from <italic>D. hansenii</italic>.</p>
<p>Information presented in <xref ref-type="fig" rid="f4"><bold>Figure 4</bold></xref> and <xref ref-type="supplementary-material" rid="ST2"><bold>Supplementary Table S2</bold></xref> showed that some species had a complement of Als proteins that possessed features of both <italic>S. cerevisiae</italic> Sag1 and <italic>C. albicans</italic> Als3. For example, <italic>S. stipitis</italic> SsAls4579 had Sag1-like features (lower left, <xref ref-type="fig" rid="f4"><bold>Figure 4</bold></xref>) while SsAls2386 and SsAls2786 looked more like <italic>C. albicans</italic> Als3 (top center, <xref ref-type="fig" rid="f4"><bold>Figure 4</bold></xref>). The line diagrams in <xref ref-type="supplementary-material" rid="SM9"><bold>Supplementary File S9</bold></xref> reinforced this idea, illustrating the extensive regions of tandemly repeated sequences in the latter two proteins (<italic>C. albicans</italic> Als-like) and lack of a repeated domain in SsAls4579 (Sag1-like). <italic>M. guilliermondii</italic> was a similar mixing bowl of Als proteins: MgAls673 was the most Sag1-like of the group. Each of the other MgAls proteins had a long stalk of tandemly repeated units with NT domains that perhaps were more like Sag1 than Als3 (<xref ref-type="supplementary-material" rid="SM7"><bold>Supplementary File S7</bold></xref>). <italic>L. elongisporus</italic> NT-Als proteins also appeared in more than one column in <xref ref-type="fig" rid="f4"><bold>Figure 4</bold></xref> with one (LeAls734) sharing greater similarity with Sag1. The recombinant nature of some of the LeAls proteins presented a more-complex picture than for <italic>S. stipitis</italic> or <italic>M. guilliermondii</italic> (<xref ref-type="supplementary-material" rid="SM6"><bold>Supplementary File S6</bold></xref>).</p>
</sec>
<sec id="s3_4">
<title>Drawing a Tree to Visualize NT-Als Relatedness</title>
<p>In addition to comparing NT-Als proteins based on the features described above, more-global comparisons were made. Clustal Omega alignment of the NT-Als sequences (<xref ref-type="supplementary-material" rid="SM5"><bold>Supplementary File S5</bold></xref>) showed identity values ranging from approximately 20% to 90% (data not shown). A maximum likelihood tree was drawn to visualize the results (<xref ref-type="fig" rid="f5"><bold>Figure 5</bold></xref><bold>)</bold>.</p>
<fig id="f5" position="float">
<label>Figure 5</label>
<caption>
<p>Relationships between NT-Als sequences depicted in a tree format. Information from <xref ref-type="fig" rid="f4"><bold>Figure 4</bold></xref> (number of Cys in NT-Als, presence of the invariant Lys, nature of the AFR) is included using symbols at the left of the tree. Yellow hexagons on the right of the branches depict ortholog group information from <xref ref-type="table" rid="T3"><bold>Table 3</bold></xref>. Colored dots indicating species follow the color scheme from <xref ref-type="supplementary-material" rid="ST2"><bold>Supplementary Table S2</bold></xref> and <xref ref-type="fig" rid="f4"><bold>Figure 4</bold></xref>. The scale bar represents substitutions per site.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fcimb-11-794529-g005.tif"/>
</fig>
<p>The topology of the tree reflected the overall diversity in NT-Als sequence identity. For example, NT-Als sequences from the closely related species <italic>C. parapsilosis</italic>/<italic>C. orthopsilosis</italic>/<italic>C. metapsilosis</italic> appeared on short branches in tight groups. In constrast, many branches showing the relationship between the highly diverse <italic>S. passalidarum</italic> NT-Als sequences were quite long, most notably for SpAls153035.5, which was the least related to other proteins in that species.</p>
<p>Als sequences from the same species tended to cluster together which made the overall tree organization similar to the species tree in <xref ref-type="fig" rid="f1"><bold>Figure 1</bold></xref>. The close relationship between <italic>C. albicans</italic> and <italic>C. dubliniensis</italic> (<xref ref-type="bibr" rid="B35">Jackson et al., 2009</xref>), as well as that between <italic>C. parapsilosis</italic>/<italic>C. orthopsilosis</italic>/<italic>C. metapsilosis</italic> (<xref ref-type="bibr" rid="B78">Tavanti et al., 2005</xref>), were reflected by the proteins from these groups being localized to distinct regions of the tree. <italic>C. tropicalis</italic> sequences were similarly clustered as were most of the <italic>S. passalidarum</italic> sequences. <italic>C. auris</italic> and <italic>C. lusitaniae</italic> sequences were grouped closely, similar to their position on the species tree (<xref ref-type="fig" rid="f1"><bold>Figure 1</bold></xref>). Within the groupings of closely related species, orthologs were obvious (e.g. CaAls6/CdAls86290, CaAls7/CdAls86150, CpAls660/CoAls800 and CoAls4210/CmAls4210-1). Examples of paralogs, likely the result of gene duplication, included CpAls4770/CpAls4780/CpAls4800, CtrAls3791/CtrAls2293/CtrAls3786, and SpAls64434/SpAls64435.</p>
<p>Similar to predictions made from the <xref ref-type="fig" rid="f4"><bold>Figure 4</bold></xref> diagram, NT-Als sequences from some species were spread across the tree. The four <italic>M. guilliermondii</italic> Als sequences were found in three different locations: MgAls673 was grouped more closely to sequences like ScSag1; MgAls2302 and MgAls3259 were clustered together near proteins from <italic>C. auris</italic>; and MgAls3330 was on its own branch elsewhere on the tree. Low bootstrap support for the latter location suggested that MgAls3330 could easily be located differently on the tree. The three sequences from <italic>S. stipitis</italic> were also dispersed with one near ScSag1 and the two others closer to the <italic>C. albicans/C. dubliniensis</italic> proteins. The five <italic>L. elongisporus</italic> Als proteins were split into two groups: the first including LeAls2536/LeAls5708/LeAls2721 (likely paralogs) and the second including LeAls734/LeAls2716 (recombinants between Als and Iff/Hyr). The Sag1-like features for SsAls4579 and MgAls673 were reflected on the tree (<xref ref-type="fig" rid="f5"><bold>Figure 5</bold></xref>), while LeAls734 and LeAls2716 (both Als recombinants with Iff/Hyr) clustered together in a different location.</p>
<p>The tree in <xref ref-type="fig" rid="f5"><bold>Figure 5</bold></xref> was drawn from a portion of each protein sequence. Another way to evaluate phylogenetic relationships is via conservation of physical location (synteny) as depicted using the <italic>Candida</italic> Gene Order Browser (CGOB; <xref ref-type="bibr" rid="B55">Maguire et al., 2013</xref>). CGOB includes all species in <xref ref-type="fig" rid="f5"><bold>Figure 5</bold></xref> except <italic>C. glabrata</italic> (<italic>CAGL0G04125g</italic>). A screenshot from one region of the CGOB was included in <xref ref-type="fig" rid="f2"><bold>Figure 2C</bold></xref>. It showed genes from several different fungal species that were orthologs of <italic>C. albicans ALS6</italic> and <italic>ALS7</italic>. Orthologs reported by CGOB are shown in <xref ref-type="table" rid="T3"><bold>Table 3</bold></xref>. Yellow hexagons with alphabetical labels were used to display the CGOB relationships on the tree in <xref ref-type="fig" rid="f5"><bold>Figure 5</bold></xref>.</p>
<table-wrap id="T3" position="float">
<label>Table 3</label>
<caption>
<p>Orthologous <italic>ALS</italic> loci reported on <italic>Candida</italic> Gene Order Browser (CGOB).</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="left">Reference Gene</th>
<th valign="top" align="center">Reported Ortholog</th>
<th valign="top" align="center">Group*</th>
<th valign="top" align="center">Reference Gene</th>
<th valign="top" align="center">Reported Ortholog</th>
<th valign="top" align="center">Group*</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left"><italic>CaALS1</italic></td>
<td valign="top" align="left"><italic>CdALS64210</italic></td>
<td valign="top" align="center"><bold>A</bold></td>
<td valign="top" align="left"><italic>CaALS7</italic></td>
<td valign="top" align="left"><italic>CdALS86150</italic></td>
<td valign="top" align="center"><bold>F</bold></td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>SsALS2386</italic><sup>&#x2020;</sup></td>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>CtrALS2228</italic></td>
<td valign="top" align="left"/>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>CpALS4800</italic></td>
<td valign="top" align="left"/>
</tr>
<tr>
<td valign="top" align="left"><italic>CaALS2</italic></td>
<td valign="top" align="left"><italic>CdALS64800</italic></td>
<td valign="top" align="center"><bold>B</bold></td>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>CoALS4220</italic></td>
<td valign="top" align="left"/>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>CtrALS3786</italic></td>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>LeALS2721</italic></td>
<td valign="top" align="left"/>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>SpALS68952</italic></td>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>CaALS9</italic></td>
<td valign="top" align="left"><italic>CdALS64220</italic></td>
<td valign="top" align="center"><bold>G</bold></td>
</tr>
<tr>
<td valign="top" align="left"><italic>CaALS3</italic></td>
<td valign="top" align="left"><italic>YtALS93631</italic></td>
<td valign="top" align="center"><bold>C</bold></td>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>LELG_04272</italic><sup>&#x2021;</sup></td>
<td valign="top" align="left"/>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>SpALS134590</italic></td>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>ScFLO1</italic><sup>&#x2021;</sup></td>
<td valign="top" align="left"/>
</tr>
<tr>
<td valign="top" colspan="6" align="left"/>
</tr>
<tr>
<td valign="top" align="left"><italic>CaALS4</italic></td>
<td valign="top" align="left"><italic>CdALS64610</italic></td>
<td valign="top" align="center"><bold>D</bold></td>
<td valign="top" align="left"><italic>CpALS4780</italic></td>
<td valign="top" align="left"><italic>CoALS4210</italic></td>
<td valign="top" align="center"><bold>H</bold></td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>CauALS2582</italic></td>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>CmALS800</italic><sup>&#x2020;</sup></td>
<td valign="top" align="left"/>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>ClALS3274</italic></td>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>PICST_31095</italic><sup>&#x2021;</sup></td>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>MgALS3330</italic></td>
<td valign="top" align="left"><italic>CpALS660</italic></td>
<td valign="top" align="center"><bold>I</bold></td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>MgALS3259</italic></td>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>CoALS800</italic></td>
<td valign="top" align="left"/>
</tr>
<tr>
<td valign="top" colspan="6" align="left"/>
</tr>
<tr>
<td valign="top" align="left"><italic>CaALS6</italic></td>
<td valign="top" align="left"><italic>CdALS86290</italic></td>
<td valign="top" align="center"><bold>E</bold></td>
<td valign="top" align="left"><italic>DhALS2178</italic><sup>&#xa7;</sup></td>
<td valign="top" align="left"><italic>SsALS4579</italic></td>
<td valign="top" align="center"><bold>J</bold></td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>CtrALS2229</italic></td>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>MgALS673</italic></td>
<td valign="top" align="left"/>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>CpALS4790</italic></td>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>CmALS4220</italic><sup>&#x2020;</sup></td>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>ScSAG1</italic></td>
<td valign="top" align="left"><italic>CdALS65010</italic></td>
<td valign="top" align="center"><bold>K</bold></td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>LeALS2716</italic></td>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>SpALS141433</italic></td>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>*Group designations were noted within yellow hexagons in <xref ref-type="fig" rid="f5"><bold>Figure 5</bold></xref>.</p>
</fn>
<fn>
<p><sup>&#x2020;</sup>For clarity, gene names from <xref ref-type="supplementary-material" rid="ST2"><bold>Supplementary Table S2</bold></xref> were used here instead of the ORF designations on CGOB. SsALS2386 was called PICST_4539 on CGOB; CmALS4220 was called CMET_1838 on CGOB, and CmALS800 was called CMET_3970.</p>
</fn>
<fn>
<p><sup>&#x2021;</sup>PICST_31095 belonged to the IFF/HYR family instead of the ALS family. LELG_04272 lacked an NT-Als domain but had tandem repeats and C-terminal sequence features similar to ALS genes. ScFLO1 belongs to a family of flocculins (<xref ref-type="bibr" rid="B26">Goossens et al., 2011</xref>). Although flocculins also have a central domain of repeated sequences, the structure of the mannose-binding N-terminal domain is clearly different from NT-Als (<xref ref-type="fig" rid="f3"><bold>Figure 3I</bold></xref>).</p>
</fn>
<fn>
<p><sup>&#xa7;</sup>Although not ALS genes, CaFGR23 (orf19.1616), Cd82280, and Ctr2409 were also in this ortholog pillar.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>CGOB ortholog designations were most reliable in closely related species such as <italic>C. albicans</italic> and <italic>C. dubliniensis</italic>: each <italic>C. albicans</italic> locus had a <italic>C. dubliniensis</italic> ortholog except <italic>CaALS3</italic> and <italic>CaALS5</italic> which are missing from the <italic>C. dubliniensis</italic> genome (<xref ref-type="bibr" rid="B35">Jackson et al., 2009</xref>). These ortholog groups were frequently augmented with genes from other species such as Group A which included <italic>SsALS2386</italic>. Groups E and F were the largest, suggesting ortholog relationships between genes in 7 and 6 species, respectively.</p>
<p>CGOB also proposed ortholog groups that did not include <italic>C. albicans</italic> or <italic>C. dubliniensis</italic> sequences. One example was Group J that included the <italic>SAG1</italic>-like <italic>MgALS673</italic> and <italic>SsALS4579</italic>, as well as <italic>DhAls2178</italic>, the lone <italic>ALS</italic> sequence from the primarily haploid <italic>D. hansenii</italic>. Examination of the predicted protein sequence showed lack of a tandem repeat domain as well as other Sag1-like features (<xref ref-type="supplementary-material" rid="SM11"><bold>Supplementary File S11</bold></xref> and <xref ref-type="fig" rid="f4"><bold>Figure 4</bold></xref>).</p>
<p>Some CGOB ortholog designations were perhaps problematic. For example, <italic>PICST_31095</italic> (Group D) belonged to the <italic>IFF/HYR</italic> family instead of <italic>ALS</italic> and <italic>ScFLO1</italic>(Group G) encoded a flocculin with a mannose-binding N-terminal domain that was structurally diverse from the Als family (<xref ref-type="fig" rid="f3"><bold>Figure 3</bold></xref>). Perhaps the most intriguing ortholog designation was Group K which included <italic>ScSAG1</italic> and <italic>CdALS65010</italic>. <italic>CdALS65010</italic> was nearly 100% identical to <italic>CdALS64800</italic>, which was included in ortholog Group B. These loci are near each other on <italic>C. dubliniensis</italic> chromosome 6 and the appear to be paralogs (i.e. recently duplicated; <xref ref-type="bibr" rid="B35">Jackson et al., 2009</xref>). As species become more divergent, assessing ortholog designations becomes more challenging. However, the suggestion of orthology between <italic>ScSAG1</italic> and a <italic>C. dubliniensis ALS</italic> gene supported the general idea that the genes were part of the same family and arose from a common ancestor.</p>
</sec>
<sec id="s3_5">
<title>Probing the Taxonomic Boundaries of the <italic>ALS</italic> Family</title>
<p>The rapidly increasing number of genome sequences present in public databases provided an opportunity to further explore the breadth and potential origin of the <italic>ALS</italic> family. The NCBI database can be queried using taxonomic identification (taxid) numbers to detect potential <italic>ALS</italic> loci more broadly across the phylogenetic tree. <xref ref-type="table" rid="T4"><bold>Table 4</bold></xref> lists the taxids for designations of the major Families within the Order Saccharomycetales. Inputs from NCBI (lifemap-ncbi-univ-lyon1.fr), <xref ref-type="bibr" rid="B74">Shen et al. (2018)</xref>, and <xref ref-type="bibr" rid="B45">Li et al. (2021)</xref> were included although the taxonomic designations were not identical among the sources. The portion of the kingdom Fungi tree (<xref ref-type="bibr" rid="B45">Li et al., 2021</xref>) that represented the Subphylum Saccharomycotina was reproduced in <xref ref-type="fig" rid="f6"><bold>Figure 6</bold></xref>.</p>
<table-wrap id="T4" position="float">
<label>Table 4</label>
<caption>
<p><italic>ALS</italic> gene representation within the Order Saccharomycetales*.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="left">Family</th>
<th valign="top" align="center">Genus/species</th>
<th valign="top" align="center"># <italic>ALS</italic> Loci</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left"><italic>Debaryomycetaceae</italic> (taxid:766764); included in CUG-Ser1 (<xref ref-type="fig" rid="f6"><bold>Figure 6</bold></xref>)</td>
<td valign="top" align="left"><italic>Candida albicans</italic> (taxid:5476)</td>
<td valign="top" align="center">8</td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>Candida dubliniensis</italic> (taxid:42373)</td>
<td valign="top" align="center">7</td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>Candida tropicalis</italic> (taxid:5482)</td>
<td valign="top" align="center">13</td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>Candida parapsilosis</italic> (taxid:5480)</td>
<td valign="top" align="center">5</td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>Candida orthopsilosis</italic> (taxid:273371)</td>
<td valign="top" align="center">3</td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>Candida metapsilosis</italic> (taxid:273372)</td>
<td valign="top" align="center">4</td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>Lodderomyces elongisporus</italic> (taxid:36914)</td>
<td valign="top" align="center">5</td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>Debaryomyces hansenii</italic> (taxid:4959)</td>
<td valign="top" align="center">1</td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>Meyerozyma guilliermondii</italic> (taxid:4929)</td>
<td valign="top" align="center">4</td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>Scheffersomyces stipitis</italic> (taxid:4924)</td>
<td valign="top" align="center">3</td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>Spathaspora passalidarum</italic> (taxid:340170)</td>
<td valign="top" align="center">29</td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>Yamadazyma tenuis</italic> (taxid:2315449)</td>
<td valign="top" align="center">1</td>
</tr>
<tr>
<td valign="top" align="left"><italic>Metschnikowiaceae</italic> (taxid:27319); included in CUG-Ser1 (<xref ref-type="fig" rid="f6"><bold>Figure 6</bold></xref>)</td>
<td valign="top" align="left"><italic>Clavispora lusitaniae</italic> (taxid:36911)</td>
<td valign="top" align="center">1</td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>Candida auris</italic> (taxid:498019)</td>
<td valign="top" align="center">3</td>
</tr>
<tr>
<td valign="top" align="left"><italic>Saccharomycetaceae</italic> (taxid:4893)</td>
<td valign="top" align="left"><italic>Saccharomyces cerevisiae</italic> (taxid:4932)</td>
<td valign="top" align="center">1</td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"><italic>Candida glabrata</italic> (taxid:5478)</td>
<td valign="top" align="center">1</td>
</tr>
<tr>
<td valign="top" align="left"><italic>Pichiaceae</italic> (taxid:1156497)</td>
<td valign="top" align="left"><italic>Pichia kudriavzevii</italic> (taxid:4909)</td>
<td valign="top" align="center">0</td>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
<td valign="top" align="left"/>
</tr>
<tr>
<td valign="top" align="left"/>
<td valign="top" align="center"><bold>Number of Species with an</bold><break/><bold>Available Genome Sequence</bold><break/><bold>in the NCBI Database</bold><break/><bold>(Accessed September 2021)</bold></td>
<td valign="bottom" align="center"><bold>Potential <italic>ALS</italic> Loci</bold></td>
</tr>
<tr>
<td valign="top" align="left"><italic>Lipomycetaceae</italic> (taxid:29827)</td>
<td valign="top" align="center">9</td>
<td valign="top" align="center">0</td>
</tr>
<tr>
<td valign="top" align="left"><italic>Trignopsidaceae</italic> (taxid:1540145)</td>
<td valign="top" align="center">6</td>
<td valign="top" align="center">0</td>
</tr>
<tr>
<td valign="top" align="left"><italic>Dipodascaceae</italic> (taxid:34353)</td>
<td valign="top" align="center">32</td>
<td valign="top" align="center">0</td>
</tr>
<tr>
<td valign="top" align="left"><italic>Trichomonascaceae</italic> (taxid:410830)</td>
<td valign="top" align="center">26</td>
<td valign="top" align="center">0</td>
</tr>
<tr>
<td valign="top" align="left"><italic>Alloascoideaceae</italic> (taxid:1540229)</td>
<td valign="top" align="center">1</td>
<td valign="top" align="center">0</td>
</tr>
<tr>
<td valign="top" align="left"><italic>Sporopachydermia</italic> clade (taxid:45793)</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">0</td>
</tr>
<tr>
<td valign="top" align="left"><italic>Cephaloascaceae</italic> (taxid:28984); included in CUG-Ser1 (<xref ref-type="fig" rid="f6"><bold>Figure 6</bold></xref>)</td>
<td valign="top" align="center">2</td>
<td valign="top" align="center">0</td>
</tr>
<tr>
<td valign="top" align="left"><italic>Pichiaceae</italic> (taxid:1156497)</td>
<td valign="top" align="center">60</td>
<td valign="top" align="center">0</td>
</tr>
<tr>
<td valign="top" align="left"><italic>Saccharomycopsidaceae</italic> (taxid:34366); overlap with CUG-Ser2 (<xref ref-type="fig" rid="f6"><bold>Figure 6</bold></xref>)</td>
<td valign="top" align="center">9</td>
<td valign="top" align="center">1</td>
</tr>
<tr>
<td valign="top" align="left"><italic>Phaffomycetaceae</italic> (taxid:115784)</td>
<td valign="top" align="center">39</td>
<td valign="top" align="center">14</td>
</tr>
<tr>
<td valign="top" align="left"><italic>Saccharomycodaceae</italic> (taxid:34365)</td>
<td valign="top" align="center">21</td>
<td valign="top" align="center">0</td>
</tr>
<tr>
<td valign="top" align="left"><italic>Saccharomycetales incertae sedis</italic> (taxid:241407)</td>
<td valign="top" align="center">37</td>
<td valign="top" align="center">4</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>*Family designations were from lifeman-ncbi-univ-lyon1.fr, as well as the work of <xref ref-type="bibr" rid="B74">Shen et al. (2018)</xref> and <xref ref-type="bibr" rid="B45">Li et al. (2021)</xref>. Taxid numbers were from the NCBI Taxonomy Database (<uri xlink:href="https://www.ncbi.nlm.nih/gov/taxonomy">https://www.ncbi.nlm.nih/gov/taxonomy</uri>). Numbers of ALS loci (right column; top half of table) were taken from the genome sequences examined in this study (<xref ref-type="table" rid="T1"><bold>Table 1</bold></xref>).</p>
</fn>
</table-wrap-foot>
</table-wrap>
<fig id="f6" position="float">
<label>Figure 6</label>
<caption>
<p>Phylogenetic tree of Families in the Order Saccharomycetales. The tree was traced from the data of <xref ref-type="bibr" rid="B45">Li et al. (2021)</xref> to highlight the region of interest for the current study. Family names were those used by <xref ref-type="bibr" rid="B45">Li et al. (2021)</xref>. <xref ref-type="table" rid="T4"><bold>Table 4</bold></xref> placed these names into the context of Family designations used on the NCBI Taxonomy Database (<xref ref-type="bibr" rid="B72">Schoch et al., 2020</xref>). The red dot denotes the common ancestor of the CUG-Ser1 clade and <italic>Saccharomycetaceae</italic>, the two groups in which <italic>ALS</italic> genes were most common (indicated by larger font). <italic>ALS</italic> genes were also detected in the <italic>Phaffomycetaceae</italic>.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fcimb-11-794529-g006.tif"/>
</fig>
<p><xref ref-type="fig" rid="f6"><bold>Figure 6</bold></xref> indicated the position of a common ancestor (red dot) for the <italic>ALS</italic> family that would include both <italic>S. cerevisiae SAG1</italic> (in the <italic>Saccharomycetaceae</italic>) and genes more closely resembling <italic>C. albicans ALS</italic> loci (in CUG-Ser1). BLAST searching using taxids did not reveal <italic>ALS</italic> loci in available genome sequences from the <italic>Lipomycetaceae</italic>, <italic>Trignopsidaceae</italic>, <italic>Dipodascaceae</italic>, <italic>Trichomonascaceae</italic>, <italic>Alloascoidaceae</italic>, or the <italic>Sporopachydermia</italic> clade (<xref ref-type="table" rid="T4"><bold>Table 4</bold></xref>). CUG-Ser1 was comprised of the <italic>Debaryomycetaceae</italic>, <italic>Metschnikowiaceae</italic>, and <italic>Cephaloascaceae</italic> (<xref ref-type="bibr" rid="B74">Shen et al., 2018</xref>). BLAST searching using taxids suggested that there were numerous additional <italic>ALS</italic> genes among the 88 <italic>Debaryomycetaceae</italic> species genomes in NCBI (accessed September 2021). Among the 62 <italic>Metschnikowiaceae</italic> species, <italic>ALS</italic> sequences were found primarily in species closely related to <italic>C. auris</italic> and <italic>C. lusitaniae</italic> including <italic>Candida haemulonii</italic>, <italic>Candida duobushaemulonis</italic>, and <italic>Candida pseudohaemulonii</italic>, all of which have been observed as pathogens (<xref ref-type="bibr" rid="B40">Jurardo-Martin et al., 2020</xref>). <italic>C. intermedia</italic>, noted for its ability to ferment xylose, as well as a rare cause of catheter-related fungemia (<xref ref-type="bibr" rid="B69">Ruan et al., 2010</xref>; <xref ref-type="bibr" rid="B23">Geijer et al., 2020</xref>) also had <italic>ALS</italic> sequences. No <italic>ALS</italic> sequences were detected in the <italic>Cephaloascaceae</italic>, although only 2 genomes were available (<xref ref-type="table" rid="T4"><bold>Table 4</bold></xref>).</p>
<p><italic>Pichia kudriavzevii</italic> (formerly <italic>Candida krusei</italic>; <xref ref-type="bibr" rid="B12">Douglass et al., 2018</xref>) was included in <xref ref-type="table" rid="T4"><bold>Table 4</bold></xref> and in <xref ref-type="fig" rid="f1"><bold>Figure 1</bold></xref> since the species is among those associated with clinical disease (<xref ref-type="bibr" rid="B25">Gomez-Gaviria and Mora-Montes, 2020</xref>). However, <italic>ALS</italic> genes were not detected in <italic>Pichia kudriavzevii</italic>, nor in the genomes of 60 other species from the Family <italic>Pichiaceae</italic> that were available in the NCBI database (<xref ref-type="table" rid="T4"><bold>Table 4</bold></xref>). No <italic>ALS</italic> sequences were detected in the species included in the CUG-Ala clade (<xref ref-type="fig" rid="f6"><bold>Figure 6</bold></xref>). The lone BLAST hit in the <italic>Saccharomycopsidaceae</italic> (<xref ref-type="table" rid="T4"><bold>Table 4</bold></xref>; overlap with CUG-Ser2 in <xref ref-type="fig" rid="f6"><bold>Figure 6</bold></xref>) was based more on the presence of Ser/Thr-rich repeated sequences than on an NT-Als adhesive domain. Additional work would be required to validate the sequence and determine if an NT-Als domain was present.</p>
<p>Potential <italic>ALS</italic> genes in the <italic>Phaffomycetaceae</italic> (<xref ref-type="table" rid="T4"><bold>Table 4</bold></xref>) were located in two species each in the genera <italic>Wickerhamomyces</italic> and <italic>Cyberlindnera</italic>; each locus encoded a potential NT-Als domain. Many additional <italic>ALS</italic> sequences were found among the 104 <italic>Saccharomycetaceae</italic> genomes available in NCBI. This family included <italic>S. cerevisiae</italic>, for which <italic>SAG1</italic> was the only BLAST hit. For other species such as <italic>Torulospora delbrueckii</italic>, a species of interest for wine making and baking (<xref ref-type="bibr" rid="B17">Fernandes et al., 2021</xref>), more than one <italic>ALS</italic> sequence was detected in the genome. One (<italic>TDEL_0E04030</italic>) predicted a protein that more closely resembled <italic>S. cerevisiae</italic> Sag1, while another (<italic>TDEL_0G04810</italic>) encoded an NT-Als domain (validated using AlphaFold; data not shown) attached to a complex C-terminal Ser/Thr-rich sequence. This predicted C-terminal domain was notable because it included 5 copies of the 45-amino acid tandem repeat found in <italic>S. cerevisiae</italic> Flo1 (<xref ref-type="bibr" rid="B77">Soares, 2010</xref>), suggesting recombination between the <italic>ALS</italic> and <italic>FLO</italic> families. A predicted protein in <italic>Lachancea thermotolerans</italic> (KLTH0C00440p) suggested an even-more-convincing recombinant that had an NT-Als domain attached to &gt; 30 copies of the Flo1 tandem repeat. These sequences require verification to ensure the recombinants were part of the genome, rather than an artifact of computational genome assembly. <italic>ALS</italic> sequences were also detected in <italic>Kazachstania</italic> species extending the representation of <italic>ALS</italic> sequences throughout the <italic>Saccharomycetaceae</italic> as defined by <xref ref-type="bibr" rid="B74">Shen et al. (2018)</xref>. Many of these sequences appeared partial, suggesting the need for PCR amplification and repair to reveal the true nature of their encoded proteins. No <italic>ALS</italic> sequences were detected among the 21 <italic>Saccharomycodaceae</italic> species queried.</p>
<p>The taxonomic category <italic>Saccharomycetales incerta sedis</italic> had four <italic>ALS</italic> sequences, all in the species <italic>Diutina rugosa</italic> (formerly <italic>Candida rugosa</italic>), which is noted as an infrequent human pathogen (<xref ref-type="bibr" rid="B56">Ming et al., 2019</xref>). Evaluation of the best hit (<italic>DIURU_002000</italic>) showed a predicted secretory signal peptide and GPI anchor addition site. Within the NT-Als region, DIURU_002000 was 37% identical to <italic>C. albicans</italic> NT-Als3, had 8 Cys in the expected locations, Arg instead of the invariant Lys, and a strong predicted AFR. AlphaFold produced the same general structure for the DIURU_002000 NT-Als protein as for those shown in <xref ref-type="fig" rid="f3"><bold>Figure 3</bold></xref> (data not shown).</p>
<p>Collectively, these observations pinpointed the location of the <italic>ALS</italic> family among currently available genome sequences and suggested potential taxonomic boundaries that will continue to be tested as more genome sequences are added to this region of the phylogenetic tree.</p>
</sec>
</sec>
<sec id="s4" sec-type="discussion">
<title>Discussion</title>
<p>Availability of genome resources for pathogenic yeasts, as well as other closely related species, provided a comparative view of the <italic>ALS</italic> family across a broader expanse of the phylogenetic tree than previously investigated. Despite advances in long-read DNA sequence technologies, many <italic>ALS</italic> loci still required PCR amplification and Sanger sequencing to derive an accurate gene count and sequence. The availability of the unprecedented protein structural prediction accuracy of AlphaFold (<xref ref-type="bibr" rid="B39">Jumper et al., 2021</xref>) provided the opportunity to demonstrate conservation of NT-Als domain shape for the proteins listed in <xref ref-type="supplementary-material" rid="ST2"><bold>Supplementary Table S2</bold></xref>. Recent addition of more than 200 new budding yeast genome sequences into the NCBI database (<xref ref-type="bibr" rid="B74">Shen et al., 2018</xref>) further bridged the gap between <italic>S. cerevisiae</italic> and <italic>C. albicans</italic> and provided a clearer picture of the <italic>ALS</italic> family breadth. In total, the information leads to the conclusions that <italic>S. cerevisiae</italic> Sag1 is an Als protein and the Als family is far more diverse than previously described.</p>
<p>Presence of the NT-Als domain is universal among the proteins in <xref ref-type="supplementary-material" rid="ST2"><bold>Supplementary Table S2</bold></xref>, and clearly is a defining characteristic for inclusion in the Als family. The AFR is recognized as part of the NT-Als domain (<xref ref-type="bibr" rid="B46">Lin et al., 2014</xref>); this sequence was absent, weaker, or perhaps in another location in many of the newly characterized Als proteins described here. Immediately following the AFR in <italic>C. albicans</italic> Als proteins is a short Thr-rich region that some publications refer to as the T domain (reviewed in <xref ref-type="bibr" rid="B32">Hoyer and Cota, 2016</xref>). The T domain in <italic>C. albicans</italic> Als proteins ends at the start of the tandem repeat region. Designating a T domain in many of the proteins described here would require arbitrary judgement calls so the region was not included in any of the line diagrams (<xref ref-type="supplementary-material" rid="SM6"><bold>Supplementary Files S6</bold></xref><bold>-</bold><xref ref-type="supplementary-material" rid="SM11"><bold>S11</bold></xref>). NT-Als domains were drawn to include all amino acids up to the start of the repeated sequences or Ser/Thr-rich regions.</p>
<p>In some proteins (e.g. SpAls55077, SpAls134590, ClAls3274), sequences similar to the <italic>C. albicans</italic> T domain are expanded into repeated sequences of variable length in the center of the protein. While all <italic>C. albicans</italic> Als proteins have a region of highly conserved, 36-amino-acid tandemly repeated sequences, this part of the Als protein is quite variable among those from other species. Variations include tandem copies of novel lengths and sequences, repeated sequences that are not necessarily tandem copies, and complete lack of repeated sequences. The latter presentation is characteristic of <italic>S. cerevisiae</italic> Sag1 and other proteins more closely related to ScSag1 on the <xref ref-type="fig" rid="f5"><bold>Figure 5</bold></xref> tree. Sequences most C-terminal in the Als family are also diverse, many featuring an enriched Ser/Thr composition. Ser/Thr richness promotes O-glycosylation that can form an extended structure on which the NT-Als domain is displayed on the cell surface (<xref ref-type="bibr" rid="B37">Jentoft, 1990</xref>). Some of the Als proteins have other amino acids (e.g. Glu, Gly, Pro) that are also enriched in the C-terminal portion of the protein or in novel, short repeated sequences.</p>
<p>Inclusion in the Als family is focused on the presence of an NT-Als domain that has the same general shape as the proteins described here (<xref ref-type="fig" rid="f3"><bold>Figure 3</bold></xref>). This Als family definition also recognizes instances of recombination between <italic>ALS</italic> genes and others encoding cell-surface proteins. A previous report (<xref ref-type="bibr" rid="B63">Oh et al., 2019</xref>) described <italic>CmALS2265</italic>, the product of recombination between <italic>ALS</italic> genes and the <italic>IFF/HYR</italic> family (<xref ref-type="bibr" rid="B1">Bailey et al., 1996</xref>; <xref ref-type="bibr" rid="B2">Bates et al., 2007</xref>; <xref ref-type="bibr" rid="B8">Chaffin, 2008</xref>; <xref ref-type="bibr" rid="B4">Boisram&#xe9; et al., 2011</xref>; <xref ref-type="bibr" rid="B67">Riccombeni et al., 2012</xref>). In the present study, additional recombinants between <italic>ALS</italic> and <italic>IFF/HYR</italic> genes were noted in <italic>L. epongisporus</italic> (<italic>LeALS734</italic> and <italic>LeALS2716</italic>). The&#xa0;tantalizing possibility of <italic>ALS/FLO</italic> recombinants in <italic>T. delbrueckii</italic> and <italic>L. thermotolerans</italic> suggests even-greater interfamily recombination as a mechanism for generating diversity on the fungal cell surface. Recombination, as the mechanism to generate novel adhesins, has been discussed previously (<xref ref-type="bibr" rid="B81">Verstrepen et al., 2004</xref>; <xref ref-type="bibr" rid="B80">Verstrepen et al., 2005</xref>) although these descriptions involved recombination between genes in the same family. In contrast, interfamily recombination places the functional NT domain from one family onto the glycosylated stalk from another. Predicted structures for the NT domains of Als, Iff/Hyr, and Flo proteins were included in <xref ref-type="fig" rid="f3"><bold>Figure 3</bold></xref> to highlight their obvious differences. Potential for hybrid function expands if the glycosylated stalk is more than just a pedestal for displaying the NT domain. These observations provide ample experimental hypotheses to pursue to better understand cell-surface diversity among the yeast species.</p>
<p>Another novel observation from the current work is the subtelomeric localization of <italic>ALS</italic> genes in multiple species including <italic>M. guilliermondii</italic> (<italic>MgALS2302</italic>, <italic>MgALS3259</italic>), <italic>C. auris</italic> (<italic>CauALS2582</italic>), and <italic>S. passalidarum</italic> (<italic>SpALS131476</italic>, <italic>SpALS137089</italic>). <italic>C. albicans</italic> subtelomeric regions are described as hotspots for genomic rearrangement, although adhesin-encoding genes are not located there (<xref ref-type="bibr" rid="B15">Dunn and Anderson, 2019</xref>). Subtelomeric location of adhesin genes is well-documented in other species such as <italic>C. glabrata</italic> (<xref ref-type="bibr" rid="B85">Xu et al., 2020</xref>). However, analysis of long-read-based genome sequences from three <italic>C. glabrata</italic> isolates suggested that changes in subtelomeric adhesin-encoding genes is due to break-induced replication, a relatively rare event that affects only the gene closest to the telomere (<xref ref-type="bibr" rid="B86">Xu et al., 2021</xref>). <xref ref-type="bibr" rid="B59">Mu&#xf1;oz et al. (2021)</xref> noted <italic>C. auris</italic> subtelomeric regions rich in genes encoding Iff/Hyr proteins, candidate cell wall proteins unique to that species, and CauAls2582. Analysis of genome sequences from 12 C<italic>. auris</italic> isolates representing diverse clades showed that Clade II isolates lose large subtelomeric regions and the cell wall genes associated with them (<xref ref-type="bibr" rid="B59">Mu&#xf1;oz et al., 2021</xref>). The consequences of <italic>ALS</italic> gene location in the subtelomeric region remain to be further explored in species such as <italic>M. guilliermondii</italic> and <italic>S. passalidarum</italic>.</p>
<p>By including Sag1 in the Als family, the definition of Als function also becomes more diverse. Sag1 binds a very specific ligand (the C-terminal peptide of <bold>a</bold>-agglutinin; <xref ref-type="bibr" rid="B7">Cappellaro et al., 1994</xref>) with high affinity. In comparison, <italic>C. albicans</italic> Als proteins can bind many ligands with lower affinity and rely on AFR-mediated protein aggregation to increase avidity (reviewed in <xref ref-type="bibr" rid="B32">Hoyer and Cota, 2016</xref>; <xref ref-type="bibr" rid="B31">Ho et al., 2019</xref>). Similar to those in <italic>C. albicans</italic>, several of the more-recently described Als proteins in other species function in adhesion to host cells or protein-coated surfaces (<xref ref-type="bibr" rid="B3">Bertini et al., 2016</xref>; <xref ref-type="bibr" rid="B60">Neale et al., 2018</xref>; <xref ref-type="bibr" rid="B93">Zoppo et al., 2018</xref>; <xref ref-type="bibr" rid="B52">Lombardi et al., 2019</xref>; <xref ref-type="bibr" rid="B91">Zoppo et al., 2020a</xref>; <xref ref-type="bibr" rid="B92">Zoppo et al., 2020b</xref>). However, considerable effort is still required to understand the specifics of these interactions. Information in <xref ref-type="fig" rid="f3"><bold>Figures 3</bold></xref>, <xref ref-type="fig" rid="f5"><bold>5</bold></xref> can be used to select proteins from along the newly defined Als family spectrum to better understand how structure contributes to functional variation. Experiments involving purified proteins and biophysical techniques could be pursued, or perhaps individual genes or chimeric constructs could be expressed in model systems such as the recently described <italic>ALS</italic>-negative <italic>C. orthopsilosis</italic> strain (<xref ref-type="bibr" rid="B94">Zoppo et al., 2019</xref>). Experimentally demonstrated structural solutions could also be pursued, and in place of the difficult-to-crystallize ScSag1, proteins close to ScSag1 on the <xref ref-type="fig" rid="f5"><bold>Figure 5</bold></xref> tree may serve as informative surrogates (e.g. Group J and CAGL0G04125G, which may be mating glycoproteins from the haploid species <italic>M. guilliermondii</italic>, <italic>D. hansenii</italic>, and <italic>S. stipitis</italic>).</p>
<p>The <italic>ALS</italic> alleles listed in <xref ref-type="supplementary-material" rid="ST2"><bold>Supplementary Table S2</bold></xref> are quite long: many are at least 5 kb and one is over 15 kb. In <italic>C. albicans</italic>, where multiple strains and <italic>ALS</italic> alleles have been examined, these long ORFs are maintained without interruption. One notable example is <italic>C. albicans ALS7</italic> that experiences frequent expansions and contractions of multiple different repeated sequences and is transcribed at an extremely low level that may not produce sufficient protein for biologically meaningful adhesive interactions (<xref ref-type="bibr" rid="B87">Zhang et al., 2003</xref>; <xref ref-type="bibr" rid="B28">Green et al., 2005</xref>). In contrast, the current study revealed the first example of <italic>ALS</italic> pseudogenes. They are found in <italic>S. passalidarum</italic> that has amplified the <italic>ALS</italic> family to 29 loci, well beyond the census in other characterized species (<xref ref-type="supplementary-material" rid="SM10"><bold>Supplementary File S10</bold></xref>). In addition to the <italic>ALS</italic> pseudogenes, many of the other <italic>S. passalidarum ALS</italic> loci encode proteins that are predicted to mislocalize compared to the <italic>C. albicans</italic> model: lack of a secretory signal peptide suggests protein that accumulates inside the cell rather than on the surface. The presence of loci that encode proteins with secretory potential, but lacking the ability to cross-link into the cell wall (i.e. no GPI anchor addition site), suggests the potential for <italic>S. passalidarum</italic> to export its own adhesion inhibitors. For example, a secreted, high-affinity binding protein could inhibit <italic>S. passalidarum</italic> adhesion to host cells, or perhaps release individual cells from host interactions or from polymicrobial structures such as biofilms. <xref ref-type="bibr" rid="B83">Wohlbach et al. (2011)</xref> pointed out that the wood-boring-beetle-associated <italic>S. passalidarum</italic> is also a commensal, similar to the typical relationship between humans and many of the fungi described here. However, only two of the SpAls proteins include all NT-Als features (8 Cys, invariant Lys, AFR) that are important for function of <italic>C. albicans</italic> Als3 (<xref ref-type="supplementary-material" rid="ST2"><bold>Supplementary Table S2</bold></xref>; <xref ref-type="supplementary-material" rid="SM10"><bold>Supplementary File S10</bold></xref>; <xref ref-type="fig" rid="f4"><bold>Figure 4</bold></xref>). The long branches associated with the <italic>S. passalidarum</italic> Als sequences in <xref ref-type="fig" rid="f5"><bold>Figure 5</bold></xref> could result from sequence substitutions due to lack of selective pressure or could indicate functional diversification that serves <italic>S. passalidarum</italic> in its ecological niche. The role of the Als proteins in <italic>S. passalidarum</italic> is another topic with many hypotheses for future exploration.</p>
<p>Additional hypotheses to test involve allelic variability and gene expression. Information reported here is limited to one allele from each species. Previous work in <italic>C. albicans</italic> revealed tremendous allelic variation, often involving copy numbers of repeated sequences, but sometimes affecting the NT-Als coding region (reviewed in <xref ref-type="bibr" rid="B33">Hoyer et al., 2008</xref>). Considerable variation is frequently observed between alleles within the same strain of a diploid species (<xref ref-type="bibr" rid="B88">Zhao et al., 2003</xref>; <xref ref-type="bibr" rid="B88">Zhao et al., 2007</xref>). It is reasonable to hypothesize that allelic variation exists among the genes and species described here. It is also reasonable to expect examples of differential gene expression with growth stage and morphology, gene expression variations between strains of the same species, and gene expression patterns that differ between <italic>in vitro</italic> and <italic>in vivo</italic> growth conditions (reviewed in <xref ref-type="bibr" rid="B33">Hoyer et al., 2008</xref>; <xref ref-type="bibr" rid="B10">Coleman et al., 2012</xref>; <xref ref-type="bibr" rid="B21">Gal&#xe1;n-Ladero et al., 2019</xref>; <xref ref-type="bibr" rid="B52">Lombardi et al., 2019</xref>). There are many exciting avenues for investigation as the nature of the <italic>ALS</italic> family continues to be discovered.</p>
</sec>
<sec id="s5" sec-type="data-availability">
<title>Data Availability Statement</title>
<p>The genome assembly for Lodderomyces elongisporus strain NRRL YB-4239, generated using Illumina MiSeq and Oxford Nanopore MinION data, is available in GenBank under BioProject accession number PRJNA432415, BioSample accession number SAMN08448784, and Genome Assembly accession number GCA_013620985.1 (ASM1362098v1). The genome assembly for Meyerozyma guilliermondii strain ATCC 6260, generated using Illumina MiSeq and Oxford Nanopore MinION data, is available in GenBank under BioProject accession number PRJNA432394, BioSample accession number SAMN08448312, and Genome Assembly accession number GCA_006942155.1 (ASM694215v1). The genome assembly for Scheffersomyces stipitis strain CBS 6054, generated using Illumina MiSeq and Oxford Nanopore MinION data, is available in GenBank under BioProject accession number PRJNA432364, BioSample accession number SAMN08446935, and Genome Assembly accession number GCA_006942115.1 (ASM694211v1). The genome assembly for Spathaspora passalidarum strain NRRL Y-27907, generated using Illumina MiSeq and Oxford Nanopore MinION data, is available in GenBank under BioProject accession number PRJNA432249, BioSample accession number SAMN08439027, and Genome Assembly accession number GCA_013620965.1 (ASM1362096v1).</p>
</sec>
<sec id="s6" sec-type="author-contributions">
<title>Author Contributions</title>
<p>LH conceptualized the study, acquired funding, and administered the project. KS, VV, CF, and AH conducted formal analysis. S-HO, AI, RR-B, CF, AH, and LH performed the investigation. CF, AH, and LH developed the study methodology. S-HO, KS, CF, AH, and LH wrote the original draft. All authors contributed to the article and approved the submitted version.</p>
</sec>
<sec id="s7" sec-type="funding-information">
<title>Funding</title>
<p>This work was funded by R15 DE026401 from the National Institute of Dental and Craniofacial Research, National Institutes of Health.</p>
</sec>
<sec id="s8" sec-type="COI-statement">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s9" sec-type="disclaimer">
<title>Publisher&#x2019;s Note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
</body>
<back>
<ack>
<title>Acknowledgments</title>
<p>This article is dedicated to the memory of Professor W. LaJean Chaffin, an outstanding scientist, mentor, and friend. Professor Chaffin shared her enthusiasm for medical mycology with many young researchers and helped them become established investigators. AI and RR-B were part of an Undergraduate Program in Fungal Genomics, which is a collaboration between the University of Illinois at Urbana-Champaign and Millikin University. Other students who contributed to this effort included Kaia Ball, Madeline Batek, Anton Bershanskiy, Stephen DeMartini, Erica Forbes, Zeidy Garcia, Jillian Jones, Jessie Kirk, Mariah McNamer, Deniz Namik, Quinn Nguyen, and Brooke Smith. The authors thank Drs. Travis Wilcoxen and Laura Zimmerman, Millikin University Department of Biology, for coordinating student participation and supervising research credit for students in the program.</p>
</ack>
<sec sec-type="supplementary-material" id="s10">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fcimb.2021.794529/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fcimb.2021.794529/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="DataSheet_1.docx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"/>
<supplementary-material xlink:href="DataSheet_2.docx" id="SM2" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"/>
<supplementary-material xlink:href="DataSheet_3.docx" id="SM3" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"/>
<supplementary-material xlink:href="DataSheet_4.docx" id="SM4" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"/>
<supplementary-material xlink:href="DataSheet_5.docx" id="SM5" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"/>
<supplementary-material xlink:href="Presentation_1.pptx" id="SM6" mimetype="application/vnd.openxmlformats-officedocument.presentationml.presentation"/>
<supplementary-material xlink:href="Presentation_2.pptx" id="SM7" mimetype="application/vnd.openxmlformats-officedocument.presentationml.presentation"/>
<supplementary-material xlink:href="Presentation_3.pptx" id="SM8" mimetype="application/vnd.openxmlformats-officedocument.presentationml.presentation"/>
<supplementary-material xlink:href="Presentation_4.pptx" id="SM9" mimetype="application/vnd.openxmlformats-officedocument.presentationml.presentation"/>
<supplementary-material xlink:href="Presentation_5.pptx" id="SM10" mimetype="application/vnd.openxmlformats-officedocument.presentationml.presentation"/>
<supplementary-material xlink:href="Presentation_6.pptx" id="SM11" mimetype="application/vnd.openxmlformats-officedocument.presentationml.presentation"/>
<supplementary-material xlink:href="Presentation_7.pptx" id="SM12" mimetype="application/vnd.openxmlformats-officedocument.presentationml.presentation"/>
<supplementary-material xlink:href="Table_1.docx" id="ST1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"/>
<supplementary-material xlink:href="Table_2.docx" id="ST2" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bailey</surname> <given-names>D. A.</given-names>
</name>
<name>
<surname>Feldmann</surname> <given-names>P. J.</given-names>
</name>
<name>
<surname>Bovey</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Gow</surname> <given-names>N. A.</given-names>
</name>
<name>
<surname>Brown</surname> <given-names>A. J.</given-names>
</name>
</person-group> (<year>1996</year>). <article-title>The <italic>Candida albicans HYR1</italic> Gene, Which is Activated in Response to Hyphal Development, Belongs to a Gene Family Encoding Yeast Cell Wall Proteins</article-title>. <source>J. Bacteriol.</source> <volume>178</volume>, <fpage>5353</fpage>&#x2013;<lpage>5360</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1128/jb.178.18.5353-5360.1996</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bates</surname> <given-names>S.</given-names>
</name>
<name>
<surname>de la Rosa</surname> <given-names>J. M.</given-names>
</name>
<name>
<surname>MacCallum</surname> <given-names>D. M.</given-names>
</name>
<name>
<surname>Brown</surname> <given-names>A. J. P.</given-names>
</name>
<name>
<surname>Gow</surname> <given-names>N. A. R.</given-names>
</name>
<name>
<surname>Odds</surname> <given-names>F. C.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title><italic>Candida albicans</italic> Iff11, a Secreted Protein Required for Cell Wall Structure and Virulence</article-title>. <source>Infect. Immun.</source> <volume>75</volume>, <fpage>2922</fpage>&#x2013;<lpage>2928</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1128/IAI.00102-07</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bertini</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Zoppo</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Lombardi</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Rizzato</surname> <given-names>C.</given-names>
</name>
<name>
<surname>De Carolis</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Vella</surname> <given-names>A.</given-names>
</name>
<etal/>
</person-group>. (<year>2016</year>). <article-title>Targeted Gene Disruption in <italic>Candida parapsilosis</italic> Demonstrates a Role for <italic>CPAR2_404800</italic> in Adhesion to a Biotic Surface and in a Murine Model of Ascending Urinary Tract Infection</article-title>. <source>Virulence</source> <volume>7</volume>, <fpage>85</fpage>&#x2013;<lpage>97</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/21505594.2015.1112491</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Boisram&#xe9;</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Cornu</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Da Costa</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Richard</surname> <given-names>M. L.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Unexpected Role for a Serine/Threonine-Rich Domain in the <italic>Candida albicans</italic> Iff Protein Family</article-title>. <source>Eukaryot Cell</source> <volume>10</volume>, <fpage>1317</fpage>&#x2013;<lpage>1330</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1128/EC.05044-11</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bolger</surname> <given-names>A. M.</given-names>
</name>
<name>
<surname>Lohse</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Usadel</surname> <given-names>B.</given-names>
</name>
</person-group>. (<year>2014</year>). <article-title>Trimmomatic: A Flexible Trimmer for Illumina Sequence Data</article-title>. <source>Bioinformatics</source> <volume>30</volume>, <fpage>2114</fpage>&#x2013;<lpage>2120</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btu170</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Butler</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Rasmussen</surname> <given-names>M. D.</given-names>
</name>
<name>
<surname>Lin</surname> <given-names>M. F.</given-names>
</name>
<name>
<surname>Santos</surname> <given-names>M. A.</given-names>
</name>
<name>
<surname>Sakthikumar</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Munro</surname> <given-names>C. A.</given-names>
</name>
<etal/>
</person-group>. (<year>2009</year>). <article-title>Evolution of Pathogenicity and Sexual Reproduction in Eight <italic>Candida</italic> Genomes</article-title>. <source>Nature</source> <volume>459</volume>, <fpage>657</fpage>&#x2013;<lpage>662</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nature08064</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cappellaro</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Baldermann</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Rachel</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Tanner</surname> <given-names>W.</given-names>
</name>
</person-group> (<year>1994</year>). <article-title>Mating Type-Specific Cell-Cell Recognition of <italic>Saccharomyces cerevisiae</italic>: Cell Wall Attachment and Active Sites of a- and &#x3b1;-Agglutinin</article-title>. <source>EMBO J.</source> <volume>20</volume>, <fpage>4737</fpage>&#x2013;<lpage>4744</lpage>. doi: <pub-id pub-id-type="doi">10.1002/j.1460-2075.1994.tb06799.x</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chaffin</surname> <given-names>W. L.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title><italic>Candida albicans</italic> Cell Wall Proteins</article-title>. <source>Microbiol. Mol. Biol. Rev.</source> <volume>72</volume>, <fpage>495</fpage>&#x2013;<lpage>544</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1128/MMBR.00032-07</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>M. H.</given-names>
</name>
<name>
<surname>Shen</surname> <given-names>Z. M.</given-names>
</name>
<name>
<surname>Bobin</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Kahn</surname> <given-names>P. C.</given-names>
</name>
<name>
<surname>Lipke</surname> <given-names>P. N.</given-names>
</name>
</person-group> (<year>1995</year>). <article-title>Structure of <italic>Saccharomyces cerevisiae</italic> Alpha-Agglutinin: Evidence for a Yeast Cell Wall Protein With Multiple Immunoglobulin-Like Domains With Atypical Disulfides</article-title>. <source>J. Biol. Chem.</source> <volume>270</volume>, <fpage>26168</fpage>&#x2013;<lpage>26177</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1074/jbc.270.44.26168</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Coleman</surname> <given-names>D. A.</given-names>
</name>
<name>
<surname>Oh</surname> <given-names>S.-H.</given-names>
</name>
<name>
<surname>Manfra-Maretta</surname> <given-names>S. L.</given-names>
</name>
<name>
<surname>Hoyer</surname> <given-names>L. L.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>A Monoclonal Antibody Specific for <italic>Candida albicans</italic> Als4 Demonstrates Overlapping Localization of Als Family Proteins on the Fungal Cell Surface and Highlights Differences Between Als Localization <italic>In Vitro</italic> and <italic>In Vivo</italic></article-title>. <source>FEMS Immunol. Med. Microbiol.</source> <volume>64</volume>, <fpage>321</fpage>&#x2013;<lpage>333</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/j.1574-695X.2011.00914.x</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cook</surname> <given-names>C. E.</given-names>
</name>
<name>
<surname>Bergman</surname> <given-names>M. T.</given-names>
</name>
<name>
<surname>Cochrane</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Apweiler</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Birney</surname> <given-names>E.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>The European Bioinformatics Institute in 2017: Data Coordination and Integration</article-title>. <source>Nucleic Acids Res.</source> <volume>46</volume>, <fpage>D21</fpage>&#x2013;<lpage>D29</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkx1154</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Douglass</surname> <given-names>A. P.</given-names>
</name>
<name>
<surname>Offei</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Braun-Galleani</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Coughlan</surname> <given-names>A. Y.</given-names>
</name>
<name>
<surname>Martos</surname> <given-names>A. A. R.</given-names>
</name>
<name>
<surname>Ortiz-Merino</surname> <given-names>R. A.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <article-title>Population Genomics Shows No Distinction Between Pathogenic <italic>Candida krusei</italic> and Environmental <italic>Pichia kudriavzevii</italic>: One Species, Four Names</article-title>. <source>PLoS Pathog.</source> <volume>14</volume>, <elocation-id>e1007138</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.ppat.1007138</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Du</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Bing</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Ennis</surname> <given-names>C. E.</given-names>
</name>
<name>
<surname>Nobile</surname> <given-names>C. J.</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>G.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title><italic>Candida auris</italic>: Epidemiology, Biology, Antifungal Resistance, and Virulence</article-title>. <source>PLoS Pathog.</source> <volume>16</volume>, <elocation-id>e1008921</elocation-id>. doi: <pub-id pub-id-type="doi">10.1371/journal.ppat.1008921</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dujon</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Sherman</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Fischer</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Durrens</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Casaregola</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Lafontaine</surname> <given-names>I.</given-names>
</name>
<etal/>
</person-group>. (<year>2004</year>). <article-title>Genome Evolution in Yeasts</article-title>. <source>Nature</source> <volume>430</volume>, <fpage>35</fpage>&#x2013;<lpage>44</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nature02579</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dunn</surname> <given-names>M. J.</given-names>
</name>
<name>
<surname>Anderson</surname> <given-names>M. Z.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>To Repeat or Not to Repeat: Repetitive Sequences Regulate Genome Stability in <italic>Candida albicans</italic></article-title>. <source>Genes</source> <volume>10</volume>:<fpage>866</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/genes10110866</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Eisenhaber</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Schneider</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Wildpaner</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Eisenhaber</surname> <given-names>F.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>A Sensitive Predictor for Potential GPI Lipid Modification Sites in Fungal Protein Sequences and its Application to Genome-Wide Studies for <italic>Aspergillus nidulans</italic>, <italic>Candida albicans</italic>, <italic>Neurospora crassa</italic>, <italic>Saccharomyces cerevisiae</italic>, and <italic>Schizosaccharmyces pombe</italic></article-title>. <source>J. Mol. Biol.</source> <volume>337</volume>, <fpage>243</fpage>&#x2013;<lpage>253</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jmb.2004.01.025</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fernandes</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Silva-Sousa</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Pereira</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Rito</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Soares</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Franco-Duarte</surname> <given-names>R.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Biotechnological Importance of <italic>Torulaspora delbrueckii</italic>: From the Obscurity to the Spotlight</article-title>. <source>J. Fungi</source> <volume>7</volume>:<fpage>712</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/jof090712</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fernandez-Escamilla</surname> <given-names>A.-M.</given-names>
</name>
<name>
<surname>Rousseau</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Schymkowitz</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Serrano</surname> <given-names>L.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Prediction of Sequence-Dependent and Mutational Effects on the Aggregation of Peptides and Proteins</article-title>. <source>Nat. Biotechnol.</source> <volume>22</volume>, <fpage>1302</fpage>&#x2013;<lpage>1306</lpage>. doi: <pub-id pub-id-type="doi">10.1038/nbt1012</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fran&#xe7;ois</surname> <given-names>F.</given-names>
</name>
<name>
<surname>No&#xeb;l</surname> <given-names>T.</given-names>
</name>
<name>
<surname>P&#xe9;pin</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Brulfert</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Chastin</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Favel</surname> <given-names>A.</given-names>
</name>
<etal/>
</person-group>. (<year>2001</year>). <article-title>Alternative Identification Test Relying Upon Sexual Reproductive Abilities of <italic>Candida lusitaniae</italic> Strains Isolated From Hospitalized Patients</article-title>. <source>J. Clin. Microbiol.</source> <volume>39</volume>, <fpage>3906</fpage>&#x2013;<lpage>3914</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1128/JCM.39.11.3906-3914.2001</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gabler</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Nam</surname> <given-names>S. Z.</given-names>
</name>
<name>
<surname>Till</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Mirdita</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Steinegger</surname> <given-names>M.</given-names>
</name>
<name>
<surname>S&#xf6;ding</surname> <given-names>J.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>Protein Sequence Analysis Using the MPI Bioinformatics Toolkit</article-title>. <source>Curr. Protoc. Bioinf.</source> <volume>72</volume>, <fpage>e108</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/cpbi.108</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gal&#xe1;n-Ladero</surname> <given-names>M. A.</given-names>
</name>
<name>
<surname>Blanco-Blanco</surname> <given-names>M. T.</given-names>
</name>
<name>
<surname>Fern&#xe1;ndez-Calder&#xf3;n</surname> <given-names>M. C.</given-names>
</name>
<name>
<surname>Lucio</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Guti&#xe9;rrez-Mart&#xed;n</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Blanco</surname> <given-names>M. T.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title><italic>Candida tropicalis</italic> Biofium Formation and Expression Levels of the <italic>CTRG ALS</italic>-Like Genes in Sessile Cells</article-title>. <source>Yeast</source> <volume>36</volume>, <fpage>107</fpage>&#x2013;<lpage>115</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/yea.3370</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Gasteiger</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Hoogland</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Gattiker</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Duvaud</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Wilkins</surname> <given-names>M. R.</given-names>
</name>
<name>
<surname>Appel</surname> <given-names>R. D.</given-names>
</name>
<etal/>
</person-group>. (<year>2005</year>). <article-title>Protein Identification and Analysis Tools on the ExPASy Server</article-title>, In: <person-group person-group-type="editor">
<name>
<surname>Walker</surname> <given-names>J. M.</given-names>
</name>
</person-group> Ed. <source>The Proteomics Protocols Handbook</source> (<publisher-loc>Totowa</publisher-loc>: <publisher-name>Humana Press</publisher-name>), <fpage>571</fpage>&#x2013;<lpage>607</lpage>. doi: <pub-id pub-id-type="doi">10.1385/1-59259-890-0:571</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Geijer</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Faria-Oliveira</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Moreno</surname> <given-names>A. D.</given-names>
</name>
<name>
<surname>Stenberg</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Mazurkewich</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Olsson</surname> <given-names>L.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Genomic and Transcriptomic Analysis of <italic>Candida intermedia</italic> Reveals the Genetic Determinants for its Xylose-Converting Capacity</article-title>. <source>Biotechnol. Biofuels</source> <volume>13</volume>, <fpage>48</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1186/s13068-020-1663-9</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Goffeau</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Barrell</surname> <given-names>B. G.</given-names>
</name>
<name>
<surname>Bussey</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Davis</surname> <given-names>R. W.</given-names>
</name>
<name>
<surname>Dujon</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Feldmann</surname> <given-names>H.</given-names>
</name>
<etal/>
</person-group>. (<year>1996</year>). <article-title>Life With 6000 Genes</article-title>. <source>Science</source> <volume>274</volume>, <fpage>563</fpage>&#x2013;<lpage>567</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1126/science.274.5287.546</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gomez-Gaviria</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Mora-Montes</surname> <given-names>H. M.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Current Aspects in the Biology, Pathogeny, and Treatment of <italic>Candida krusei</italic>, a Neglected Fungal Pathogen</article-title>. <source>Infect. Drug Resist.</source> <volume>13</volume>, <fpage>1673</fpage>&#x2013;<lpage>1689</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.2147/IDR.S247944</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Goossens</surname> <given-names>K. V. Y.</given-names>
</name>
<name>
<surname>Stassen</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Stals</surname> <given-names>I.</given-names>
</name>
<name>
<surname>Donohue</surname> <given-names>D. S.</given-names>
</name>
<name>
<surname>Devreese</surname> <given-names>B.</given-names>
</name>
<name>
<surname>De Greve</surname> <given-names>H.</given-names>
</name>
<etal/>
</person-group>. (<year>2011</year>). <article-title>The N-Terminal Domain of the Flo1 Flocculation Protein From <italic>Saccharomyces cerevisiae</italic> Binds Specifically to Mannose Carbohydrates</article-title>. <source>Eukarot Cell</source> <volume>10</volume>, <fpage>110</fpage>&#x2013;<lpage>117</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1128/EC.00185-10</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gori</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Knudsen</surname> <given-names>P. B.</given-names>
</name>
<name>
<surname>Nielsen</surname> <given-names>K. F.</given-names>
</name>
<name>
<surname>Arneborg</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Jespersen</surname> <given-names>L.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Alcohol-Based Quorum Sensing Plays a Role in Adhesion and Sliding Motility of the Yeast <italic>Debaryomyces hansenii</italic></article-title>. <source>FEMS Yeast. Res.</source> <volume>11</volume>, <fpage>643</fpage>&#x2013;<lpage>652</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/j.1567-1364.2011.00755.x</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Green</surname> <given-names>C. B.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Yeater</surname> <given-names>K. M.</given-names>
</name>
<name>
<surname>Hoyer</surname> <given-names>L. L.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Construction and Real-Time RT-PCR Validation of <italic>Candida albicans</italic> P<italic>ALS</italic>-GFP Reporter Strains and Their Use in Flow Cytometry Analysis of <italic>ALS</italic> Gene Expression in Budding and Filamentous Cells</article-title>. <source>Microbiology</source> <volume>151</volume>, <fpage>1051</fpage>&#x2013;<lpage>1060</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1099/mic.0.27696-0</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Grigorescu</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>M.-H.</given-names>
</name>
<name>
<surname>Zhao</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Khan</surname> <given-names>P. C.</given-names>
</name>
<name>
<surname>Lipke</surname> <given-names>P. N.</given-names>
</name>
</person-group> (<year>2000</year>). <article-title>A CD2-Based Model of Yeast Alpha-Agglutinin Elucidates Solution Properties and Binding Characteristics</article-title>. <source>IUBMB Life</source> <volume>50</volume>, <fpage>105</fpage>&#x2013;<lpage>113</lpage>. doi: <pub-id pub-id-type="doi">10.1080/713803692</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Guin</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Mishra</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Muzaki</surname> <given-names>S. R. B.</given-names>
</name>
<name>
<surname>Thimmappa</surname> <given-names>B. C.</given-names>
</name>
<name>
<surname>O&#x2019;Brien</surname> <given-names>C. E.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>Spatial Inter-Centromeric Interactions Facilitated the Emergence of Evolutionary New Centromeres</article-title>. <source>Elife</source> <volume>9</volume>, <elocation-id>e58556</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.7554/eLife.58556</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ho</surname> <given-names>V.</given-names>
</name>
<name>
<surname>Herman-Bausier</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Shaw</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Conrad</surname> <given-names>K. A.</given-names>
</name>
<name>
<surname>Garcia-Sherman</surname> <given-names>M. C.</given-names>
</name>
<name>
<surname>Draghi</surname> <given-names>J.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>An Amyloid Core Sequence in the Major <italic>Candida albicans</italic> Adhesin Als1p Mediates Cell-Cell Adhesion</article-title>. <source>mBio</source> <volume>10</volume>, <fpage>e01766</fpage>&#x2013;<lpage>e01719</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1128/mBio.01766-19</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hoyer</surname> <given-names>L. L.</given-names>
</name>
<name>
<surname>Cota</surname> <given-names>E.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title><italic>Candida albicans</italic> Agglutinin-Like Sequence (Als) Family Vignettes: A Review of Als Protein Structure and Function</article-title>. <source>Front. Microbiol.</source> <volume>7</volume>, <elocation-id>280</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fmicb.2016.00280</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hoyer</surname> <given-names>L. L.</given-names>
</name>
<name>
<surname>Green</surname> <given-names>C. B.</given-names>
</name>
<name>
<surname>Oh</surname> <given-names>S.-H.</given-names>
</name>
<name>
<surname>Hoyer</surname> <given-names>L. L.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Discovering the Secrets of the <italic>Candida albicans</italic> Agglutinin-Like Sequence (<italic>ALS</italic>) Gene Family &#x2013; a Sticky Pursuit</article-title>. <source>Med. Mycol.</source> <volume>46</volume>, <fpage>1</fpage>&#x2013;<lpage>15</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/13693780701435317</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hoyer</surname> <given-names>L. L.</given-names>
</name>
<name>
<surname>Scherer</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Shatzman</surname> <given-names>A. R.</given-names>
</name>
<name>
<surname>Livi</surname> <given-names>G. P.</given-names>
</name>
</person-group> (<year>1995</year>). <article-title><italic>Candida albicans</italic> ALS1: Domains Related to a <italic>Saccharomyces cerevisiae</italic> Sexual Agglutinin Separated by a Repeating Motif</article-title>. <source>Mol. Microbiol.</source> <volume>15</volume>, <fpage>39</fpage>&#x2013;<lpage>54</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/j.1365-2958.1995</pub-id>. tb02219.x.
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jackson</surname> <given-names>A. P.</given-names>
</name>
<name>
<surname>Gamble</surname> <given-names>J. A.</given-names>
</name>
<name>
<surname>Yeomans</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Moran</surname> <given-names>G. P.</given-names>
</name>
<name>
<surname>Saunders</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Harris</surname> <given-names>D.</given-names>
</name>
<etal/>
</person-group>. (<year>2009</year>). <article-title>Comparative Genomics of the Fungal Pathogens <italic>Candida dubliniensis</italic> and <italic>Candida albicans</italic></article-title>. <source>Genome Res.</source> <volume>19</volume>, <fpage>2231</fpage>&#x2013;<lpage>2244</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1101/gr.097501.109</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jeffries</surname> <given-names>T. W.</given-names>
</name>
<name>
<surname>Grigoriev</surname> <given-names>I. V.</given-names>
</name>
<name>
<surname>Grimwood</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Laplaza</surname> <given-names>J. M.</given-names>
</name>
<name>
<surname>Aerts</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Salamov</surname> <given-names>A.</given-names>
</name>
<etal/>
</person-group>. (<year>2007</year>). <article-title>Genome Sequence of the Lignocellulose-Bioconverting and Xylose-Fermenting Yeast <italic>Pichia stipitis</italic></article-title>. <source>Nat. Biotechnol.</source> <volume>25</volume>, <fpage>319</fpage>&#x2013;<lpage>326</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nbt1290</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jentoft</surname> <given-names>N.</given-names>
</name>
</person-group> (<year>1990</year>). <article-title>Why are Proteins O-Glycosylated</article-title>? <source>Trends Biochem. Sci.</source> <volume>15</volume>, <fpage>291</fpage>&#x2013;<lpage>294</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/0968-0004(90)90014-3</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jones</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Federspiel</surname> <given-names>N. A.</given-names>
</name>
<name>
<surname>Chibana</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Dungan</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Kalman</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Magee</surname> <given-names>B. B.</given-names>
</name>
<etal/>
</person-group>. (<year>2004</year>). <article-title>The Diploid Genome Sequence of <italic>Candida albicans</italic></article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>101</volume>, <fpage>7329</fpage>&#x2013;<lpage>7334</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.0401648101</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jumper</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Evans</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Pritzel</surname></name>
<name>
<surname>Green</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Figurnov</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Ronneberger</surname> <given-names>O.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Highly Accurate Protein Structure Prediction With AlphaFold</article-title>. <source>Nature</source> <volume>596</volume>, <fpage>583</fpage>&#x2013;<lpage>589</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41586-021-03819-2</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jurardo-Martin</surname> <given-names>I.</given-names>
</name>
<name>
<surname>Marcos-Arias</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Tamayo</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Guridi</surname> <given-names>A.</given-names>
</name>
<name>
<surname>de Groot</surname> <given-names>P. W. J.</given-names>
</name>
<name>
<surname>Quind&#xf3;s</surname> <given-names>G.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title><italic>Candida duobushaemulonii</italic>: An Old But Unreported Pathogen</article-title>. <source>J. Fungi</source> <volume>6</volume>, <fpage>374</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/jof6040374</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Katoh</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Standley</surname> <given-names>D. M.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>MAFFT Multiple Sequence Alignment Software Version 7: Improvements in Performance and Usability</article-title>. <source>Mol. Biol. Evol.</source> <volume>30</volume>, <fpage>772</fpage>&#x2013;<lpage>780</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/mst010</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Koren</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Walenz</surname> <given-names>B. P.</given-names>
</name>
<name>
<surname>Berlin</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Miller</surname> <given-names>J. R.</given-names>
</name>
<name>
<surname>Bergman</surname> <given-names>N. H.</given-names>
</name>
<name>
<surname>Phillippy</surname> <given-names>A. M.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Canu: Scalable and Accurate Long-Read Assembly via Adaptive k-mer Weighting and Repeat Separation</article-title>. <source>Genome Res.</source> <volume>27</volume>, <fpage>722</fpage>&#x2013;<lpage>736</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1101/gr.215087.116</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kozlov</surname> <given-names>A. M.</given-names>
</name>
<name>
<surname>Darriba</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Flouri</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Morel</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Stamatakis</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>RAxML-NG: A Fast, Scalable and User-Friendly Tool for Maximum Likelihood Phylogenetic Inference</article-title>. <source>Bioinformatics</source> <volume>35</volume>, <fpage>4453</fpage>&#x2013;<lpage>4455</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/btz305</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>H.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Minimap2: Pairwise Alignment for Nucleotide Sequences</article-title>. <source>Bioinformatics</source> <volume>34</volume>, <fpage>3094</fpage>&#x2013;<lpage>3100</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/bty191</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Steenwyk</surname> <given-names>J. L.</given-names>
</name>
<name>
<surname>Chang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>James</surname> <given-names>T. Y.</given-names>
</name>
<name>
<surname>Stajich</surname> <given-names>J. E.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>A Genome-Scale Phylogeny of the Kingdom Fungi</article-title>. <source>Curr. Biol.</source> <volume>26</volume>, <fpage>1653</fpage>&#x2013;<lpage>1665</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.cub.2021.01.074</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lin</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Oh</surname> <given-names>S.-H.</given-names>
</name>
<name>
<surname>Jones</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Garnett</surname> <given-names>J. A.</given-names>
</name>
<name>
<surname>Salgado</surname> <given-names>P. S.</given-names>
</name>
<name>
<surname>Rushnakova</surname> <given-names>S.</given-names>
</name>
<etal/>
</person-group>. (<year>2014</year>). <article-title>The Peptide-Binding Cavity is Essential for Als3-Mediated Adhesion of <italic>Candida albicans</italic> to Human Cells</article-title>. <source>J. Biol. Chem.</source> <volume>289</volume>, <fpage>18401</fpage>&#x2013;<lpage>18412</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1074/jbc.M114.547877</pub-id>
</citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lipke</surname> <given-names>P. N.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>What We Do Not Know About Fungal Cell Adhesion Molecules</article-title>. <source>J. Fungi</source> <volume>4</volume>:<fpage>59</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/jof4020059</pub-id>
</citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lipke</surname> <given-names>P. N.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>M. H.</given-names>
</name>
<name>
<surname>de Nobel</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Kurjan</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Kahn</surname> <given-names>P. C.</given-names>
</name>
</person-group> (<year>1995</year>). <article-title>Homology Modeling of an Immunoglobulin-Like Domain in the <italic>Saccharomyces cerevisiae</italic> Adhesion Protein Alpha-Agglutinin</article-title>. <source>Protein Sci.</source> <volume>4</volume>, <fpage>2168</fpage>&#x2013;<lpage>2178</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/pro.5560041023</pub-id>
</citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lipke</surname> <given-names>P. N.</given-names>
</name>
<name>
<surname>Klotz</surname> <given-names>S. A.</given-names>
</name>
<name>
<surname>Dufrene</surname> <given-names>Y. F.</given-names>
</name>
<name>
<surname>Jackson</surname> <given-names>D. N.</given-names>
</name>
<name>
<surname>Garcia-Sherman</surname> <given-names>M. C.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Amyloid-Like &#x3b2;-Aggregates as Force-Sensitive Switches in Fungal Biofilms and Infections</article-title>. <source>Microbiol. Mol. Biol. Rev.</source> <volume>82</volume>, <fpage>e00035</fpage>&#x2013;<lpage>e00017</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1128/MMBR.00035-17</pub-id>
</citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lockhart</surname> <given-names>S. R.</given-names>
</name>
<name>
<surname>Etienne</surname> <given-names>K. A.</given-names>
</name>
<name>
<surname>Vallabhaneni</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Chowdhary</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Govender</surname> <given-names>N. P.</given-names>
</name>
<name>
<surname>Colombo</surname> <given-names>A. L.</given-names>
</name>
<etal/>
</person-group>. (<year>2017</year>). <article-title>Simultaneous Emergence of Multidrug-Resistant <italic>Candida auris</italic> on 3 Continents Confirmed by Whole-Genome Sequencing and Epidemiological Analyses</article-title>. <source>Clin. Infect. Dis.</source> <volume>64</volume>, <fpage>134</fpage>&#x2013;<lpage>140</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/cid/ciw691</pub-id>
</citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lockhart</surname> <given-names>S. R.</given-names>
</name>
<name>
<surname>Messer</surname> <given-names>S. A.</given-names>
</name>
<name>
<surname>Pfaller</surname> <given-names>M. A.</given-names>
</name>
<name>
<surname>Diekema</surname> <given-names>D. J.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title><italic>Lodderomyces elongisporus</italic> Masquerading as <italic>Candida parapsilosis</italic> as a Cause of Bloodsream Infections</article-title>. <source>J. Clin. Microbiol.</source> <volume>46</volume>, <fpage>374</fpage>&#x2013;<lpage>376</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1128/JCM.01790-07</pub-id>
</citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lombardi</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Zoppo</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Rizzato</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Bottai</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Hernandez</surname> <given-names>A. G.</given-names>
</name>
<name>
<surname>Hoyer</surname> <given-names>L. L.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>Characterization of the <italic>Candida orthopsilosis</italic> Agglutinin-Like Sequence (<italic>ALS</italic>) Genes</article-title>. <source>PLoS One</source> <volume>14</volume>, <elocation-id>e0215912</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pone.0215912</pub-id>
</citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lu</surname> <given-names>C. F.</given-names>
</name>
<name>
<surname>Kurjan</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Lipke</surname> <given-names>P. N.</given-names>
</name>
</person-group> (<year>1994</year>). <article-title>A Pathway for Cell Wall Anchorage of <italic>Saccharomyces cerevisiae</italic> Alpha-Agglutinin</article-title>. <source>Mol. Cell Biol.</source> <volume>14</volume>, <fpage>4825</fpage>&#x2013;<lpage>4833</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1128/mcb.14.7.4825-4833</pub-id>
</citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Madeira</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Park</surname> <given-names>Y. M.</given-names>
</name>
<name>
<surname>Lee</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Buso</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Gur</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Madhusoodanan</surname> <given-names>N.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>The EMBL-EBI Search and Sequence Analysis Tools APIs in 2019</article-title>. <source>Nucl. Acids Res.</source> <volume>47</volume>, <fpage>W636</fpage>&#x2013;<lpage>W641</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkz268</pub-id>
</citation>
</ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Maguire</surname> <given-names>S. L.</given-names>
</name>
<name>
<surname>&#xd3;h&#xc9;igeartaigh</surname> <given-names>S. S.</given-names>
</name>
<name>
<surname>Byrne</surname> <given-names>K. P.</given-names>
</name>
<name>
<surname>Schr&#xf6;der</surname> <given-names>M. S.</given-names>
</name>
<name>
<surname>O&#x2019;Gaora</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Wolfe</surname> <given-names>K. H.</given-names>
</name>
<etal/>
</person-group> (<year>2013</year>). <article-title>Comparative Genome Analysis and Gene Finding in <italic>Candida</italic> Species Using CGOB</article-title>. <source>Mol. Biol. Evol.</source> <volume>30</volume>, <fpage>1281</fpage>&#x2013;<lpage>1291</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/molbev/mst042</pub-id>
</citation>
</ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ming</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Lv</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>T.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>Revision of the Medically Relevant Species of the Yeast <italic>Genus Diutina</italic></article-title>. <source>Med. Mycol.</source> <volume>57</volume>, <fpage>226</fpage>&#x2013;<lpage>233</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/mmy/myy001</pub-id>
</citation>
</ref>
<ref id="B57">
<citation citation-type="other">
<person-group person-group-type="author">
<name>
<surname>Mirdita</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Ovchinnikov</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Steinegger</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>ColabFold &#x2013; Making Protein Folding Accessible to All</article-title>. <source>bioRxiv. preprint.</source> doi:&#xa0;<pub-id pub-id-type="doi">10.1101/2021.08.15.456425</pub-id>
</citation>
</ref>
<ref id="B58">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mortensen</surname> <given-names>H. D.</given-names>
</name>
<name>
<surname>Gori</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Jespersen</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Arneborg</surname> <given-names>N.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title><italic>Debaryomyces hansenii</italic> Strains With Different Cell Sizes and Surface Physicochemical Properties Adhere Differently to a Solid Agarose Surface</article-title>. <source>FEMS Microbiol. Lett.</source> <volume>249</volume>, <fpage>165</fpage>&#x2013;<lpage>170</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.femsle.2005.06.009</pub-id>
</citation>
</ref>
<ref id="B59">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mu&#xf1;oz</surname> <given-names>J. F.</given-names>
</name>
<name>
<surname>Welsh</surname> <given-names>R. M.</given-names>
</name>
<name>
<surname>Shea</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Batra</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Gade</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Howard</surname> <given-names>D.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Clade-Specific Chromosomal Rearrangements and Loss of Subtelomeric Adhesins in <italic>Candida auris</italic></article-title>. <source>Genetics</source> <volume>218</volume>, <elocation-id>iyab029</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/genetics/iyab029</pub-id>
</citation>
</ref>
<ref id="B60">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Neale</surname> <given-names>M. N.</given-names>
</name>
<name>
<surname>Glass</surname> <given-names>K. A.</given-names>
</name>
<name>
<surname>Longley</surname> <given-names>S. J.</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>D. J.</given-names>
</name>
<name>
<surname>Laforce-Nesbitt</surname> <given-names>S. S.</given-names>
</name>
<name>
<surname>Wortzel</surname> <given-names>J. D.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <article-title>Role of the Inducible Adhesin CpAls7 in Binding of <italic>Candida parapsilosis</italic> to the Extracellular Matrix Under Fluid Shear</article-title>. <source>Infect. Immun.</source> <volume>86</volume>, <fpage>e00892</fpage>&#x2013;<lpage>e00817</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1128/IAI.00892-17</pub-id>
</citation>
</ref>
<ref id="B61">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Nielsen</surname> <given-names>H.</given-names>
</name>
</person-group> (<year>2017</year>). &#x201c;<article-title>Predicting Secretory Proteins With SignalP</article-title>,&#x201d; in <source>Protein Function Prediction, Methods in Molecular Biology</source>, vol. <volume>1611</volume>. Ed. <person-group person-group-type="editor">
<name>
<surname>Kihara</surname> <given-names>D.</given-names>
</name>
</person-group> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>Humana Press</publisher-name>), <fpage>59</fpage>&#x2013;<lpage>73</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/978-1-4939-7015-5_6</pub-id>
</citation>
</ref>
<ref id="B62">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Oh</surname> <given-names>S.-H.</given-names>
</name>
<name>
<surname>Isenhower</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Rodriguez-Bobadilla</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Smith</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Jones</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Hubka</surname> <given-names>V.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Pursuing Advances in DNA Sequencing Technology to Solve a Complex Genomic Jigsaw Puzzle: The Agglutinin-Like Sequence (<italic>ALS</italic>) Genes of <italic>Candida tropicalis</italic></article-title>. <source>Front. Microbiol.</source> <volume>11</volume>, <elocation-id>594531</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fmicb.2020.594531</pub-id>
</citation>
</ref>
<ref id="B63">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Oh</surname> <given-names>S.-H.</given-names>
</name>
<name>
<surname>Smith</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Miller</surname> <given-names>A. N.</given-names>
</name>
<name>
<surname>Staker</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Fields</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Hernandez</surname> <given-names>A.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>Agglutinin-Like Sequence (<italic>ALS</italic>) Genes in the <italic>Candida parapsilosis</italic> Species Complex: Blurring the Boundaries Between Gene Families That Encode Cell-Wall Proteins</article-title>. <source>Front. Microbiol.</source> <volume>10</volume>, <elocation-id>781</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fmicb.2019.00781</pub-id>
</citation>
</ref>
<ref id="B64">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Papon</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Savini</surname> <given-names>V.</given-names>
</name>
<name>
<surname>Lanoue</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Simkin</surname> <given-names>A. J.</given-names>
</name>
<name>
<surname>Cr&#xe8;che</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Giglioli-Guivarc&#x2019;h</surname> <given-names>N.</given-names>
</name>
<etal/>
</person-group>. (<year>2013</year>). <article-title><italic>Candida guilliermondii</italic>: Biotechnological Applications, Perspectives for Biological Control, Emerging Clinical Importance and Recent Advances in Genetics</article-title>. <source>Curr. Genet.</source> <volume>59</volume>, <fpage>73</fpage>&#x2013;<lpage>90</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s00294-013-0391-0</pub-id>
</citation>
</ref>
<ref id="B65">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Paradis</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Schliep</surname> <given-names>K.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>ape 5.0: An Environment for Modern Phylogenetics and Evolutionary Analyses in R</article-title>. <source>Bioinformatics</source> <volume>35</volume>, <fpage>526</fpage>&#x2013;<lpage>528</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bioinformatics/bty633</pub-id>
</citation>
</ref>
<ref id="B66">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Peters</surname> <given-names>B. M.</given-names>
</name>
<name>
<surname>Ovchinnikova</surname> <given-names>E. S.</given-names>
</name>
<name>
<surname>Krom</surname> <given-names>B. P.</given-names>
</name>
<name>
<surname>Schlecht</surname> <given-names>L. M.</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Hoyer</surname> <given-names>L. L.</given-names>
</name>
<etal/>
</person-group>. (<year>2012</year>). <article-title><italic>Staphylococcus aureus</italic> Adherence to <italic>Candida albicans</italic> Hyphae is Mediated by the Hyphal Adhesin Als3p</article-title>. <source>Microbiology</source> <volume>158</volume>, <fpage>2975</fpage>&#x2013;<lpage>2986</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1099/mic.0.062109-0</pub-id>
</citation>
</ref>
<ref id="B67">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Riccombeni</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Vidanes</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Proux.W&#xe9;ra</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Wolfe</surname> <given-names>K. H.</given-names>
</name>
<name>
<surname>Butler</surname> <given-names>G.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Sequence and Analysis of the Genome of the Pathogenic Yeast <italic>Candida orthopsilosis</italic></article-title>. <source>PLoS One</source> <volume>7</volume>, <elocation-id>e35750</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal.pone.0035750</pub-id>
</citation>
</ref>
<ref id="B68">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rousseau</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Schymkowitz</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Serrano</surname> <given-names>L.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>Protein Aggregation and Amyloidosis: Confusion of the Kinds</article-title>? <source>Curr. Opin. Struct. Biol.</source> <volume>16</volume>, <fpage>118</fpage>&#x2013;<lpage>126</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.sbi.2006.01.011</pub-id>
</citation>
</ref>
<ref id="B69">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ruan</surname> <given-names>S. Y.</given-names>
</name>
<name>
<surname>Chein</surname> <given-names>J. Y.</given-names>
</name>
<name>
<surname>Hou</surname> <given-names>Y. C.</given-names>
</name>
<name>
<surname>Hsueh</surname> <given-names>P. R.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Catheter-Related Fungemia Caused by <italic>Candida intermedia</italic></article-title>. <source>Int. J. Infect. Dis.</source> <volume>14</volume>, <fpage>147</fpage>&#x2013;<lpage>149</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.ijid.2009.03.015</pub-id>
</citation>
</ref>
<ref id="B70">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Salgado</surname> <given-names>P. S.</given-names>
</name>
<name>
<surname>Yan</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Taylor</surname> <given-names>J. D.</given-names>
</name>
<name>
<surname>Burchell</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Jones</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Hoyer</surname> <given-names>L. L.</given-names>
</name>
<etal/>
</person-group>. (<year>2011</year>). <article-title>Structural Basis for the Broad Specificity to Host-Cell Ligands by the Pathogenic Fungus <italic>Candida albicans</italic></article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>108</volume>, <fpage>15775</fpage>&#x2013;<lpage>15779</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.1103496108</pub-id>
</citation>
</ref>
<ref id="B71">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Santos</surname> <given-names>M. A. S.</given-names>
</name>
<name>
<surname>Gomes</surname> <given-names>A. C.</given-names>
</name>
<name>
<surname>Santos</surname> <given-names>M. C.</given-names>
</name>
<name>
<surname>Carreto</surname> <given-names>L. C.</given-names>
</name>
<name>
<surname>Moura</surname> <given-names>G. R.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>The Genetic Code of the Fungal CTG Clade</article-title>. <source>C R. Biologies</source> <volume>334</volume>, <fpage>607</fpage>&#x2013;<lpage>611</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.cvri.2011.05.008</pub-id>
</citation>
</ref>
<ref id="B72">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Schoch</surname> <given-names>C. L.</given-names>
</name>
<name>
<surname>Ciufo</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Domrachev</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Hotton</surname> <given-names>C. L.</given-names>
</name>
<name>
<surname>Kannan</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Khovanskaya</surname> <given-names>R.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>NCBI Taxonomy: A Comprehensive Update on Curation, Resources and Tools</article-title>. <source>Database</source> <volume>2020</volume>, <elocation-id>baaa062</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/database/baaa062</pub-id>
</citation>
</ref>
<ref id="B73">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Senol Cali</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>J. S.</given-names>
</name>
<name>
<surname>Ghose</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Alkan</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Mutlu</surname> <given-names>O.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Nanopore Sequencing Technology and Tools for Genome Assembly: Computational Analysis of the Current State, Bottlenecks and Future Directions</article-title>. <source>Brief. Bioinform.</source> <volume>20</volume>, <fpage>1542</fpage>&#x2013;<lpage>1559</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/bib/bby017</pub-id>
</citation>
</ref>
<ref id="B74">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shen</surname> <given-names>X.-X.</given-names>
</name>
<name>
<surname>Opulente</surname> <given-names>D. A.</given-names>
</name>
<name>
<surname>Kominek</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Steenwyk</surname> <given-names>J. L.</given-names>
</name>
<name>
<surname>Buh</surname> <given-names>K. V.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <article-title>Tempo and Mode of Genome Evolution in the Budding Yeast Subphylum</article-title>. <source>Cell</source> <volume>175</volume>, <fpage>1533</fpage>&#x2013;<lpage>1545</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.cell.2018.10.023</pub-id>
</citation>
</ref>
<ref id="B75">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Sherman</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Fink</surname> <given-names>G. R.</given-names>
</name>
<name>
<surname>Hicks</surname> <given-names>J. B.</given-names>
</name>
</person-group> (<year>1986</year>). <source>Laboratory Course Manual for Methods in Yeast Genetics</source> (<publisher-loc>Cold Spring Harbor, NY</publisher-loc>: <publisher-name>Cold Spring Harbor Press</publisher-name>).
</citation>
</ref>
<ref id="B76">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Skrzypek</surname> <given-names>M. S.</given-names>
</name>
<name>
<surname>Binkley</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Binkley</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Miyasato</surname> <given-names>S. R.</given-names>
</name>
<name>
<surname>Simison</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Sherlock</surname> <given-names>G.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>The <italic>Candida</italic> Genome Database (CGD): Incorporation of Assembly 22, Systematic Identifiers and Visualization of High Throughput Sequencing Data</article-title>. <source>Nucleic Acids Res.</source> <volume>45</volume>, <fpage>D592</fpage>&#x2013;<lpage>D596</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/nar/gkw924</pub-id>
</citation>
</ref>
<ref id="B77">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Soares</surname> <given-names>E. V.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Flocculation in <italic>Saccharomyces cerevisiae</italic>: A Review</article-title>. <source>J. Appl. Microbiol.</source> <volume>110</volume>, <fpage>1</fpage>&#x2013;<lpage>18</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/j.1365-2672.2010.04897.x</pub-id>
</citation>
</ref>
<ref id="B78">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tavanti</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Davidson</surname> <given-names>A. D.</given-names>
</name>
<name>
<surname>Gow</surname> <given-names>N. A.</given-names>
</name>
<name>
<surname>Maiden</surname> <given-names>M. C.</given-names>
</name>
<name>
<surname>Odds</surname> <given-names>F. C.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title><italic>Candida orthopsilosis</italic> and <italic>Candida metapsilosis</italic> spp. nov. Replace <italic>Candida parapsilosis</italic> Groups II and III</article-title>. <source>J. Clin. Microbiol.</source> <volume>43</volume>, <fpage>284</fpage>&#x2013;<lpage>292</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1128/JCM</pub-id>. 43.1.284-292.2005.
</citation>
</ref>
<ref id="B79">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vale-Silva</surname> <given-names>L. A.</given-names>
</name>
<name>
<surname>Sanglard</surname> <given-names>D.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Tipping the Balance Both Ways: Drug Resistance and Virulence in <italic>Candida glabrata</italic></article-title>. <source>FEMS Yeast. Res.</source> <volume>15</volume>:<elocation-id>fov025</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/femsyr/fov025</pub-id>
</citation>
</ref>
<ref id="B80">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Verstrepen</surname> <given-names>K. J.</given-names>
</name>
<name>
<surname>Jansen</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Lewitter</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Fink</surname> <given-names>G. R.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Intragenic Tandem Repeats Generate Functional Variability</article-title>. <source>Nat. Genet.</source> <volume>37</volume>, <fpage>986</fpage>&#x2013;<lpage>990</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/ng1618</pub-id>
</citation>
</ref>
<ref id="B81">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Verstrepen</surname> <given-names>K. J.</given-names>
</name>
<name>
<surname>Reynolds</surname> <given-names>T. B.</given-names>
</name>
<name>
<surname>Fink</surname> <given-names>G. R.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Origins of Variation in the Fungal Cell Surface</article-title>. <source>Nat. Rev.</source> <volume>2</volume>, <fpage>533</fpage>&#x2013;<lpage>540</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nrmicro927</pub-id>
</citation>
</ref>
<ref id="B82">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Walker</surname> <given-names>B. J.</given-names>
</name>
<name>
<surname>Abeel</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Shea</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Priest</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Abouelliel</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Sakthikumar</surname> <given-names>S.</given-names>
</name>
<etal/>
</person-group>. (<year>2014</year>). <article-title>Pilon: An Integrated Tool for Comprehensive Microbial Variant Detection and Genome Assembly Improvement</article-title>. <source>PLoS One</source> <volume>9</volume>, <fpage>e112963</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1371/journal</pub-id>. pone.0112963.
</citation>
</ref>
<ref id="B83">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wohlbach</surname> <given-names>D. J.</given-names>
</name>
<name>
<surname>Kuo</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Sato</surname> <given-names>T. K.</given-names>
</name>
<name>
<surname>Potts</surname> <given-names>K. M.</given-names>
</name>
<name>
<surname>Salamov</surname> <given-names>A. A.</given-names>
</name>
<name>
<surname>Labutti</surname> <given-names>K. M.</given-names>
</name>
<etal/>
</person-group>. (<year>2011</year>). <article-title>Comparative Genomics of Xylose-Fermenting Fungi for Enhanced Biofuel Production</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>108</volume>, <fpage>13212</fpage>&#x2013;<lpage>13217</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.1103039108</pub-id>
</citation>
</ref>
<ref id="B84">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wojciechowicz</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Lu</surname> <given-names>C. F.</given-names>
</name>
<name>
<surname>Kurjan</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Lipke</surname> <given-names>P. N.</given-names>
</name>
</person-group> (<year>1993</year>). <article-title>Cell Surface Anchorage and Ligand-Binding Domains of the <italic>Saccharomyces cerevisiae</italic> Cell Adhesion Protein Alpha-Agglutinin, a Member of the Immunoglobulin Superfamily</article-title>. <source>Mol. Cell. Biol.</source> <volume>13</volume>, <fpage>2554</fpage>&#x2013;<lpage>2563</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1128/mcb.13.4.2554-2563.1993</pub-id>
</citation>
</ref>
<ref id="B85">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Green</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Benoit</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Schatz</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Wheelan</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Cormack</surname> <given-names>B.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>De Novo Genome Assembly of <italic>Candida glabrata</italic> Reveals Cell Wall Protein Complement and Structure of Dispersed Tandem Repeat Arrays</article-title>. <source>Mol. Microbiol.</source> <volume>113</volume>, <fpage>1209</fpage>&#x2013;<lpage>1224</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/mmi.14488</pub-id>
</citation>
</ref>
<ref id="B86">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Green</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Benoit</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Sobel</surname> <given-names>J. D.</given-names>
</name>
<name>
<surname>Schatz</surname> <given-names>M. C.</given-names>
</name>
<name>
<surname>Wheelan</surname> <given-names>S.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Cell Wall Protein Variation, Break-Induced Replication, and Subtelomere Dynamics in <italic>Candida glabrata</italic></article-title>. <source>Mol. Microbiol.</source> <volume>116</volume>, <fpage>260</fpage>&#x2013;<lpage>276</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1111/mmi.14707</pub-id>
</citation>
</ref>
<ref id="B87">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Harrex</surname> <given-names>A. L.</given-names>
</name>
<name>
<surname>Holland</surname> <given-names>B. R.</given-names>
</name>
<name>
<surname>Fenton</surname> <given-names>L. E.</given-names>
</name>
<name>
<surname>Cannon</surname> <given-names>R. D.</given-names>
</name>
<name>
<surname>Schmid</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2003</year>). <article-title>Sixty Alleles of the <italic>ALS7</italic> Open Reading Frame in <italic>Candida albicans</italic>: <italic>ALS7</italic> is a Hypermutable Contingency Locus</article-title>. <source>Genome Res.</source> <volume>13</volume>, <fpage>2005</fpage>&#x2013;<lpage>2017</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1101/gr.1024903</pub-id>
</citation>
</ref>
<ref id="B88">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhao</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Oh</surname> <given-names>S.-H.</given-names>
</name>
<name>
<surname>Jajko</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Diekema</surname> <given-names>D. J.</given-names>
</name>
<name>
<surname>Pfaller</surname> <given-names>M. A.</given-names>
</name>
<name>
<surname>Pujol</surname> <given-names>C.</given-names>
</name>
<etal/>
</person-group>. (<year>2007</year>). <article-title>Analysis of <italic>ALS5</italic> and <italic>ALS6</italic> Allelic Variability in a Geographically Diverse Collection of <italic>Candida albicans</italic> Isolates</article-title>. <source>Fungal Genet. Biol.</source> <volume>44</volume>, <fpage>1298</fpage>&#x2013;<lpage>1309</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.fgb.2007.05.004</pub-id>
</citation>
</ref>
<ref id="B89">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhao</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Shen</surname> <given-names>Z.-M.</given-names>
</name>
<name>
<surname>Kahn</surname> <given-names>P. C.</given-names>
</name>
<name>
<surname>Lipke</surname> <given-names>P. N.</given-names>
</name>
</person-group> (<year>2001</year>). <article-title>Interaction of &#x3b1;-Agglutinin and <bold>a</bold>-Agglutinin, <italic>Saccharomyces cerevisiae</italic> Sexual Cell Adhesion Molecules</article-title>. <source>J. Bacteriol.</source> <volume>183</volume>, <fpage>2874</fpage>&#x2013;<lpage>2880</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1128/JB.183.9.2874-2880.2001</pub-id>
</citation>
</ref>
<ref id="B90">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zimmerman</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Stephens</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Nam</surname> <given-names>S. Z.</given-names>
</name>
<name>
<surname>Rau</surname> <given-names>D.</given-names>
</name>
<name>
<surname>K&#xfc;bler</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Lozajic</surname> <given-names>M.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <article-title>A Completely Reimplemented MPI Bioinformatics Toolkit With a New HHpred Server at its Core</article-title>. <source>J. Mol. Biol.</source> <volume>430</volume>, <fpage>2237</fpage>&#x2013;<lpage>2243</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.jmb.2017.12.007</pub-id>
</citation>
</ref>
<ref id="B91">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zoppo</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Di Luca</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Franco</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Rizzato</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Lupetti</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Stringaro</surname> <given-names>A.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>a). <article-title><italic>CpALS4770</italic> and <italic>CpALS4780</italic> Contribution to the Virulence of <italic>Candida parapsilosis</italic></article-title>. <source>Microbiol. Res.</source> <volume>231</volume>, <elocation-id>126351</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.micres.2019.126351</pub-id>
</citation>
</ref>
<ref id="B92">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zoppo</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Fiorentini</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Rizzato</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Di Luca</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Lupetti</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Bottai</surname> <given-names>D.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>b). <article-title>Role of <italic>CpALS4780</italic> and <italic>CpALS0660</italic> in <italic>Candida parapsilosis</italic> Virulence: Evidence From a Murine Model of Vaginal Candidiasis</article-title>. <source>J. Fungi</source> <volume>6</volume>:<fpage>86</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/jof6020086</pub-id>
</citation>
</ref>
<ref id="B93">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zoppo</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Lombardi</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Rizzato</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Lupetti</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Bottai</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Papp</surname> <given-names>C.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <article-title><italic>CORT0C04210</italic> is Required for <italic>Candida orthopsilosis</italic> Adhesion to Human Buccal Cells</article-title>. <source>Fungal Genet. Biol.</source> <volume>120</volume>, <fpage>19</fpage>&#x2013;<lpage>29</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.fgb.2018.09.001</pub-id>
</citation>
</ref>
<ref id="B94">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zoppo</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Luca</surname> <given-names>M. D.</given-names>
</name>
<name>
<surname>Villareal</surname> <given-names>S. N.</given-names>
</name>
<name>
<surname>Poma</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Barrasa</surname> <given-names>M. I.</given-names>
</name>
<name>
<surname>Bottai</surname> <given-names>D.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>A CRISPR/Cas9-Based Strategy to Simultaneously Inactivate the Entire <italic>ALS</italic> Gene Family in <italic>Candida orthopsilosis</italic></article-title>. <source>Future Microbiol.</source> <volume>14</volume>, <fpage>1383</fpage>&#x2013;<lpage>1396</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.2217/fmb-2019-0168</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>