<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Microbiol.</journal-id>
<journal-title>Frontiers in Microbiology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Microbiol.</abbrev-journal-title>
<issn pub-type="epub">1664-302X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fmicb.2022.839524</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Microbiology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Pangenome Analysis of the Soilborne Fungal Phytopathogen <italic>Rhizoctonia solani</italic> and Development of a Comprehensive Web Resource: RsolaniDB</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Kaushik</surname> <given-names>Abhinav</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1605393/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Roberts</surname> <given-names>Daniel P.</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/634187/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Ramaprasad</surname> <given-names>Abhinay</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1646244/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Mfarrej</surname> <given-names>Sara</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Nair</surname> <given-names>Mridul</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Lakshman</surname> <given-names>Dilip K.</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1244390/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Pain</surname> <given-names>Arnab</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="corresp" rid="c002"><sup>&#x002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/477580/overview"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Biological and Environmental Science and Engineering Division, King Abdullah University of Science and Technology (KAUST)</institution>, <addr-line>Thuwal</addr-line>, <country>Saudi Arabia</country></aff>
<aff id="aff2"><sup>2</sup><institution>Sustainable Agricultural Systems Laboratory, United States Department of Agriculture-Agricultural Research Service (USDA-ARS)</institution>, <addr-line>Beltsville, MD</addr-line>, <country>United States</country></aff>
<aff id="aff3"><sup>3</sup><institution>International Institute for Zoonosis Control, Hokkaido University</institution>, <addr-line>Sapporo</addr-line>, <country>Japan</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Matthias Sipiczki, University of Debrecen, Hungary</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Youxiong Que, Fujian Agriculture and Forestry University, China; Gopaljee Jha, National Institute of Plant Genome Research (NIPGR), India</p></fn>
<corresp id="c001">&#x002A;Correspondence: Dilip K. Lakshman, <email>dilip.lakshman@usda.gov</email></corresp>
<corresp id="c002">Arnab Pain, <email>arnab.pain@kaust.edu.sa</email></corresp>
<fn fn-type="other" id="fn004"><p>This article was submitted to Food Microbiology, a section of the journal Frontiers in Microbiology</p></fn>
</author-notes>
<pub-date pub-type="epub">
<day>25</day>
<month>03</month>
<year>2022</year>
</pub-date>
<pub-date pub-type="collection">
<year>2022</year>
</pub-date>
<volume>13</volume>
<elocation-id>839524</elocation-id>
<history>
<date date-type="received">
<day>20</day>
<month>12</month>
<year>2021</year>
</date>
<date date-type="accepted">
<day>08</day>
<month>02</month>
<year>2022</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2022 Kaushik, Roberts, Ramaprasad, Mfarrej, Nair, Lakshman and Pain.</copyright-statement>
<copyright-year>2022</copyright-year>
<copyright-holder>Kaushik, Roberts, Ramaprasad, Mfarrej, Nair, Lakshman and Pain</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<p>Rhizoctonia solani is a collective group of genetically and pathologically diverse basidiomycetous fungi that damage economically important crops. Its isolates are classified into 13 Anastomosis Groups (AGs) and subgroups having distinctive morphology and host ranges. The genetic factors driving the unique features of <italic>R. solani</italic> pathology are not well characterized due to the limited availability of its annotated genomes. Therefore, we performed genome sequencing, assembly, annotation and functional analysis of 12 <italic>R. solani</italic> isolates covering 7 AGs and select subgroups (AG1-IA; AG1-IB; AG1-IC; AG2-2IIIB; AG3-PT, isolates Rhs 1AP and the hypovirulent Rhs1A1; AG3-TB; AG4-HG-I, isolates Rs23 and R118-11; AG5; AG6; and AG8), in which six genomes are reported for the first time. Using a pangenome comparative analysis of 12 <italic>R. solani</italic> isolates and 15 other Basidiomycetes, we defined the unique and shared secretomes, CAZymes, and effectors across the AGs. We have also elucidated the <italic>R. solani</italic>-derived factors potentially involved in determining AG-specific host preference, and the attributes distinguishing them from other Basidiomycetes. Finally, we present the largest repertoire of <italic>R. solani</italic> genomes and their annotated components as a comprehensive database, viz. RsolaniDB, with tools for large-scale data mining, functional enrichment and sequence analysis not available with other state-of-the-art platforms.</p>
</abstract>
<kwd-group>
<kwd>basidiomycetous fungi</kwd>
<kwd>soilborne plant pathogen</kwd>
<kwd><italic>Rhizoctonia solani</italic></kwd>
<kwd>NGS&#x2014;next generation sequencing</kwd>
<kwd>genomics</kwd>
<kwd>pangenome analyses</kwd>
<kwd>pathogenicity genes</kwd>
<kwd>genome database</kwd>
</kwd-group>
<contract-num rid="cn001">BAS/1/1020-01-01</contract-num>
<contract-num rid="cn002">Agreement #-58-8042-8-067-F</contract-num>
<contract-sponsor id="cn001">King Abdullah University of Science and Technology<named-content content-type="fundref-id">10.13039/501100004052</named-content></contract-sponsor>
<contract-sponsor id="cn002">U.S. Department of Agriculture<named-content content-type="fundref-id">10.13039/100000199</named-content></contract-sponsor>
<counts>
<fig-count count="6"/>
<table-count count="0"/>
<equation-count count="0"/>
<ref-count count="80"/>
<page-count count="16"/>
<word-count count="11309"/>
</counts>
</article-meta>
</front>
<body>
<sec id="S1" sec-type="intro">
<title>Introduction</title>
<p><italic>Rhizoctonia solani</italic> K&#x00FC;hn [teleomorph: <italic>Thanatephorus cucumeris</italic> (Frank) Donk] is considered one of the most destructive soil-borne plant pathogens causing various diseases including pre- and post-emergence damping-off of seedlings, crown and root rots, black scurf of potato, take-all of wheat, sheath blight of rice and maize, brown patch of turf, and postharvest fruit rots (<xref ref-type="bibr" rid="B77">Yang and Li, 2012</xref>; <xref ref-type="bibr" rid="B3">Amaradasa et al., 2013</xref>). This necrotrophic fungus infects a wide range of economically important plant species, belonging to more than 32 plant families and 188 genera, and is responsible for 15&#x2013;50% of agricultural damage annually (<xref ref-type="bibr" rid="B60">Raaijmakers et al., 2009</xref>). Broadly, it is classified among 13 Anastomosis Groups (AGs) with distinctive morphology, physiology, pathogenicity host range, and highly divergent genetic composition (<xref ref-type="bibr" rid="B28">G&#x00F3;nzalez et al., 2016</xref>). Most <italic>R. solani</italic> AGs are further divided into subgroups which differ in pathogenicity, virulence, ability to form sclerotia, growth rate, and host range preference (<xref ref-type="bibr" rid="B40">Keijer et al., 1997</xref>). Although field isolates of <italic>Rhizoctonia</italic> infected plants are usually found to be infested with one or more AGs, each AG subgroup can still have its own host preference. For instance, <italic>Arabidopsis thaliana</italic> was found to be susceptible to AG2-1 sub-group isolates but resistant to AG8 isolates (<xref ref-type="bibr" rid="B25">Foley et al., 2013</xref>), which suggests that genetic divergence is the inherent characteristic of <italic>Rhizoctonia</italic> species.</p>
<p>Over the last two decades, our understanding of the genetic divergence among different <italic>R. solani</italic> AGs has improved to the point that it is now evident that all AGs and their sub-groups are genetically isolated, non-interbreeding populations (<xref ref-type="bibr" rid="B27">Gonzalez et al., 2001</xref>). The rapid and relatively low-cost of generation of genomic sequences and other &#x201C;<italic>omics</italic>&#x201D; datasets has played a significant role in furthering our understanding of the host-pathogen interactions and ecology of <italic>Rhizoctonia</italic> species. (<xref ref-type="bibr" rid="B32">Hane et al., 2014</xref>; <xref ref-type="bibr" rid="B34">Hossain et al., 2014</xref>; <xref ref-type="bibr" rid="B4">Anderson et al., 2016</xref>; <xref ref-type="bibr" rid="B45">Lakshman et al., 2016</xref>; <xref ref-type="bibr" rid="B18">Copley et al., 2017</xref>). The analysis of these genomic sequences and functional components revealed several novel or previously unrecognized classes of <italic>R. solani</italic> genes among different AGs that are involved in pathogenesis in a host-specific manner, e.g., effector proteins and carbohydrate-active enzymes (CAZymes) (<xref ref-type="bibr" rid="B72">Wibberg et al., 2016b</xref>). Additionally, analysis of differentially expressed genes in different isolates has enabled researchers to predict the adaptive behavior of this fungus in different hosts and the associated virulence (<xref ref-type="bibr" rid="B80">Zhang et al., 2017</xref>; <xref ref-type="bibr" rid="B64">Shu et al., 2019</xref>). However, the majority of this information has come from the analysis of isolates belonging to only a small number of AGs for which complete genome and/or transcriptome sequences are available. In fact, until now, draft genome assemblies belonging to only 4 of the 13 AGs have been reported viz. AG1-IA (<xref ref-type="bibr" rid="B57">Nadarajah et al., 2017</xref>; <xref ref-type="bibr" rid="B26">Ghosh et al., 2019</xref>; <xref ref-type="bibr" rid="B46">Lee et al., 2021</xref>), AG1-IB (<xref ref-type="bibr" rid="B74">Wibberg et al., 2015a</xref>,<xref ref-type="bibr" rid="B75">b</xref>), AG2-2IIIB (<xref ref-type="bibr" rid="B72">Wibberg et al., 2016b</xref>), AG3-Rhs1AP (<xref ref-type="bibr" rid="B20">Cubeta et al., 2014</xref>), AG3-PT isolate Ben-3 (<xref ref-type="bibr" rid="B73">Wibberg et al., 2017</xref>) and AG8 (<xref ref-type="bibr" rid="B32">Hane et al., 2014</xref>). This limited availability of genome sequences and the predicted proteomes across the 13 different AGs and their subgroups is one of the important barriers hindering the understanding of functional complexity and temporal dynamics in <italic>R. solani</italic> AGs and their subgroups.</p>
<p>In this study, we report whole-genome sequencing, assembly and annotation of 12 <italic>Rhizoctonia</italic> isolates from 7 AGs; of which genome sequences of three AGs (AG4, AG5, and AG6), two subgroups (AG1-IC and AG3-TB {or AG3-T5}) and a hypovirulent isolate (AG3-1A1) of the subgroup AG3-PT are being reported for the first time. The draft genome of the AG3-PT isolate 1AP (alternatively named as Rhs1AP) was previously reported (<xref ref-type="bibr" rid="B20">Cubeta et al., 2014</xref>), but was re-sequenced for comparative purposes, as AG3-1AP. To make these high-quality draft <italic>R. solani</italic> genomes and features readily accessible to a broad audience of researchers, we built a comprehensive and dedicated web resource, viz. RsolaniDB, for hosting and analyzing the available genomic information predicted at the transcript-, and protein-level in different <italic>R. solani</italic> AGs.</p>
</sec>
<sec id="S2" sec-type="materials|methods">
<title>Materials and Methods</title>
<sec id="S2.SS1">
<title>Isolation of Genomic DNAs for Sequencing</title>
<p>Details regarding <italic>R. solani</italic> isolates used for sequence analyses are presented in <xref ref-type="supplementary-material" rid="DS1">Supplementary Tables 1</xref>, <xref ref-type="supplementary-material" rid="DS1">2</xref>. Fungal cultures were purified by the hyphal tip excision method (<xref ref-type="bibr" rid="B12">Bills et al., 1993</xref>) and maintained by sub-culturing on potato dextrose agar (PDA; Sigma Aldrich catalog # P2182, St. Louis, MO, United States). The PDA was amended with kanamycin (25 &#x03BC;g/ml) and streptomycin (50 &#x03BC;g/ml) to inhibit bacterial growth. Isolates were grown in potato dextrose broth (PDB; Sigma Aldrich catalog # P6685) at 100 rpm and 25&#x00B0;C for 4&#x2013;6 days, mycelia collected by filtration through 2 layers of sterile cheese cloth, washed 2 X with sterile distilled water, gently squeezed and placed on 4 layers of paper towels to remove surface water, and then snap-frozen in liquid nitrogen and stored at &#x2013;80&#x00B0;C till use. Genomic DNA was extracted from mycelia using both the CTAB method (<xref ref-type="bibr" rid="B17">Carlson et al., 1991</xref>) and a protocol recommended by the manufacturer (User-Developed Protocol: Isolation of genomic DNA from plants and filamentous fungi using the QIAGEN<sup>&#x00AE;</sup> Genomic-tip, Qiagen, Inc., Germantown, MD, United States). RNA was extracted from fungal isolates and from tobacco detached leaves infected with corresponding fungal isolates, using the Qiagen RNeasy Plant Mini Kit (Qiagen, Inc.). Extracted genomic DNA and RNA was quantified with a Qubit Flex Fluorometer (Thermo Fisher Scientific, Waltham, MA, United States). AG and subgroup identity of the fungal isolates was verified by ITS-PCR, sequencing and homology analysis with nucleotide sequences available in the NCBI database (<xref ref-type="bibr" rid="B62">Sayers et al., 2020</xref>).</p>
</sec>
<sec id="S2.SS2">
<title>RNA Extraction</title>
<p><italic>Nicotiana tabacum</italic> seedlings were raised to the four-leaf stage on potting mix (Pro-mix, Premier Horticulture, Quakertown, PA, United States) in the greenhouse at ambient temperature (22&#x00B0;&#x2013;24&#x00B0;C) and 4 h supplemental light with a mercury lamp. Two leaves were excised from each seedling and placed on a tray on two pieces of wet paper towels. For inoculation, seven to eight agar plugs from the margin of fresh <italic>R. solani</italic> growth on 1/4-strength PDA were placed on the adaxial surface of each leaf. Seven to eight non-inoculated agar plugs of 1/4-strength PDA were used as controls. Each tray was covered with a lid and incubated on lab bench at ambient temperature with light as above.</p>
<p>After 5 days, yellow to necrotic symptoms were noticeable on <italic>R. solani</italic> treated leaves but no symptoms appeared on control leaves. The control and infected patches of the leaf were excised with a sterile scalpel, snap frozen in liquid nitrogen and processed for RNA extraction with the RNeasy Plus Mini Kit in RLC buffer (Qiagen, Inc.). The purified RNA was treated with DNase at 37&#x00B0;C for 30 min, extracted with phenol and phenol: chloroform, precipitated with ethanol, and dissolved in RNase-free water.</p>
</sec>
<sec id="S2.SS3">
<title>Construction of Genomic and RNA Libraries and Sequencing</title>
<p>For making genomic libraries, 500 ng of DNA from each sample was sheared with a Covaris sonicator (Covaris E series, Covaris, Inc., Woburn, MA, United States) and paired-end libraries were prepared for sequencing using an Illumina&#x2019;s HiSeq 2000 platform (Illumina, Inc., San Diego, CA, United States). From end repair until adapter ligation and purification steps of the paired-end, libraries were prepared using the protocol &#x201C;Illumina library prep&#x201D; on the IP-Star automated platform (Diagenode IP Star, Diagenode, Inc., Denville, NJ, United States) as per the manufacturer&#x2019;s protocol. Post ligation, manual protocols were used for gel size selection and PCR amplification using the standard Illumina PCR Cycle (Kapa high-fidelity master mix). The prepared libraries were analyzed on a bioanalyzer and quantified using Qubit (Thermo Fisher Scientific). The normalized libraries were pooled for sequencing (insert size of 500 bp) and submitted for HiSeq 2000 sequencing at the Bioscience Core Laboratory of King Abdullah University of Science and Technology.</p>
<p>Strand-specific mRNA sequencing was performed from total RNA using TruSeq Stranded mRNA Sample Prep Kit LT (Illumina, Inc.) according to the manufacturer&#x2019;s instructions. Briefly, polyA+ mRNA was purified from total RNA using oligo-dT dynabead selection. First strand cDNA was synthesized using randomly primed oligos followed by second strand synthesis where dUTPs were incorporated to achieve strand-specificity. The cDNA was adapter-ligated and the libraries amplified by PCR. Libraries were sequenced in an Illumina Hiseq 2000 with paired-end 100 bp read chemistry.</p>
</sec>
<sec id="S2.SS4">
<title><italic>De novo</italic> Assembly, Genome Annotation and Bioinformatic Analysis</title>
<sec id="S2.SS4.SSS1">
<title>Data Preprocessing</title>
<p>Adapter sequences in genomic reads in FASTQ format were trimmed using the trimmomatic tool (version 0.35) (<xref ref-type="bibr" rid="B14">Bolger et al., 2014</xref>), followed by trimming low-quality bases at read ends. Read quality was evaluated using the fastqc tool (version 0.11.8) (Simon <xref ref-type="bibr" rid="B5">Andrews, 2020</xref>). Reads with length &#x003C; 20 bp and average quality score &#x003C; 30 were removed. For genome heterogeneity analysis, <italic>k-mer</italic> distribution analysis on resulting DNAseq reads was performed using jellyfish (version 2.2.10) (<xref ref-type="bibr" rid="B52">Mar&#x00E7;ais and Kingsford, 2011</xref>), which estimated best <italic>k-mer</italic> length for each genome. Histogram distributions of different <italic>k-mers</italic> for the best <italic>k-mer</italic> length were plotted using the <italic>-histo</italic> module of the jellyfish program. In addition, the available raw RNAseq paired-end reads (<xref ref-type="supplementary-material" rid="DS1">Supplementary Table 2</xref>) were quality trimmed and preprocessed using the same approach used for DNAseq reads. The quality trimmed reads were then subjected to <italic>de novo</italic> assembly using Trinity which predicted transcript sequences (<xref ref-type="bibr" rid="B29">Grabherr et al., 2011</xref>). These assembled RNAseq transcripts were used for genome assembly, scaffolding and gene prediction purposes.</p>
</sec>
<sec id="S2.SS4.SSS2">
<title>Genome Assembly</title>
<p>Quality trimmed reads were subjected to <italic>de novo</italic> genome assembly using SPAdes (version 3.7.0) in which a defined range of <italic>k-mer</italic> lengths (21, 33, 55, 65, 77, 101, and 111) was used for contig formation (<xref ref-type="bibr" rid="B7">Bankevich et al., 2012</xref>). Quast (version 4.5) was used for quality evaluation of predicted contigs (<xref ref-type="bibr" rid="B30">Gurevich et al., 2013</xref>). Scaffolds were subsequently predicted from contigs using SSPACE (version3.0) (<xref ref-type="bibr" rid="B13">Boetzer et al., 2011</xref>) and gaps in assembled scaffolds filled using five consecutive runs of GapCloser (version 1.12) (<xref ref-type="bibr" rid="B51">Luo et al., 2012</xref>). For samples with a RNAseq dataset available, genome scaffolding was further improved using the Rascaf program (<xref ref-type="bibr" rid="B65">Song et al., 2016</xref>). Genome quality was evaluated with BUSCO (version 3.0.1) (<xref ref-type="bibr" rid="B63">Seppey et al., 2019</xref>) and scaffolds subjected to ITSx (version 1.1) (<xref ref-type="bibr" rid="B10">Bengtsson-Palme et al., 2013</xref>) for ITS sequence prediction. Thereafter, a phylogenetic tree was constructed with megax software (<xref ref-type="bibr" rid="B43">Kumar et al., 2018</xref>) using the neighborhood joining method (10,000 bootstraps), in which ITS2 sequences were aligned using ClustalW (<xref ref-type="bibr" rid="B61">R&#x00E9;dei, 2008</xref>). The resulting tree was saved in the newick format and visualized together using Phylogeny.IO (<xref ref-type="bibr" rid="B37">Jovanovic and Mikheyev, 2019</xref>) and ETE toolkit (<xref ref-type="bibr" rid="B35">Huerta-Cepas et al., 2016</xref>). Redundans python script was then used to predict the homozygous genome by reducing the unwanted redundancy to improve draft genome quality (<xref ref-type="bibr" rid="B58">Pryszcz and Gabald&#x00F3;n, 2016</xref>). Resulting scaffolds were aligned with mitochondrial genomes of <italic>R. solani</italic> and other Basidiomycota using the blastn program (version 2.6.0; <italic>e</italic>-value &#x2264;1e<sup>&#x2013;5</sup>) (<xref ref-type="bibr" rid="B15">Camacho et al., 2009</xref>) and mapped mitochondrial contigs were removed to retain only the nuclear genome for subsequent annotation.</p>
</sec>
<sec id="S2.SS4.SSS3">
<title>Genome Annotation</title>
<p>The draft genome was annotated using the MAKER (version 2.31.8) pipeline (<xref ref-type="bibr" rid="B16">Cantarel et al., 2008</xref>), which predicted intron/exon boundaries, transcript and protein sequences. For the annotation, repeat regions were masked using RepeatMasker (version 4.0.5; model_org = fungi) (<xref ref-type="bibr" rid="B68">Tarailo-Graovac and Chen, 2009</xref>). Protein homology evidence was taken from UniProt protein sequences (Reviewed; family: Basidiomycota) (<xref ref-type="bibr" rid="B9">Bateman et al., 2017</xref>). For EST evidence, RNAseq reads were assembled into transcripts using Trinity <italic>de novo</italic> assembler (version 2.0.6) (<xref ref-type="bibr" rid="B29">Grabherr et al., 2011</xref>). For genomic datasets without corresponding RNAseq datasets available, the EST sequences of alternate organisms were used from previously published <italic>R. solani</italic> genome annotations viz. AG1-IA (<xref ref-type="bibr" rid="B57">Nadarajah et al., 2017</xref>), AG1-IB (<xref ref-type="bibr" rid="B74">Wibberg et al., 2015a</xref>), AG2-2IIIB (<xref ref-type="bibr" rid="B72">Wibberg et al., 2016b</xref>), AG3-Rhs1AP (<xref ref-type="bibr" rid="B20">Cubeta et al., 2014</xref>), AG3-PT isolate Ben-3 (<xref ref-type="bibr" rid="B73">Wibberg et al., 2017</xref>) and AG8 (<xref ref-type="bibr" rid="B32">Hane et al., 2014</xref>). The functional domains, PANTHER pathways (<xref ref-type="bibr" rid="B56">Mi and Thomas, 2009</xref>) and Gene Ontology (GO) terms (<xref ref-type="bibr" rid="B6">Ashburner et al., 2000</xref>) in the predicted protein sequences were assigned using the InterProScan (version 5.45&#x2013;80.0) standalone program (<xref ref-type="bibr" rid="B59">Quevillon et al., 2005</xref>). The functional domains assigned to each protein included the information from ProSiteProfiles (<xref ref-type="bibr" rid="B36">Hulo et al., 2004</xref>), CDD (<xref ref-type="bibr" rid="B54">Marchler-Bauer et al., 2013</xref>), Pfam (<xref ref-type="bibr" rid="B23">Finn et al., 2014</xref>) and TIGRFAMs (<xref ref-type="bibr" rid="B31">Haft et al., 2003</xref>), resulting in the annotated genome in GFF3 format using iprscan2gff3 and ipr_update_gff programs (<xref ref-type="bibr" rid="B59">Quevillon et al., 2005</xref>).</p>
<p>We also identified the predicted secreted proteins in each of the <italic>R. solani</italic> proteomes using signalp (version 5.0) (<xref ref-type="bibr" rid="B2">Almagro Armenteros et al., 2019</xref>). For identification of proteins with a transmembrane domain, phobius (version 1.01) (<xref ref-type="bibr" rid="B38">K&#x00E4;ll et al., 2007</xref>) was used. We used targetp (version 1.1) to predict proteins with mitochondrial signal peptides (<xref ref-type="bibr" rid="B21">Emanuelsson et al., 2007</xref>). However, since we already removed mitochondrial contigs from assembled genomes, we did not observe any proteins with a mitochondrial signal peptide. Effector proteins in each <italic>R. solani</italic> secretome were predicted using effectorP webserver (version 2.0) (<xref ref-type="bibr" rid="B66">Sperschneider et al., 2016</xref>). The Carbohydrate Active enZymes (CAZyme) in <italic>R. solani</italic> proteomes were predicted using dbCAN2 webserver, in which only the proteins predicted by at least two prediction methods were considered (<xref ref-type="bibr" rid="B79">Zhang et al., 2018</xref>). The CAZyme family predicted by HMMER was used for the selected proteins.</p>
</sec>
<sec id="S2.SS4.SSS4">
<title>Orthology</title>
<p>Orthologous proteins across all proteomes were identified with orthoMCL clustering using the Synima program (<xref ref-type="bibr" rid="B47">Li et al., 2003</xref>; <xref ref-type="bibr" rid="B22">Farrer, 2017</xref>), which identified core, unique and auxiliary regions in each <italic>R. solani</italic> proteome. This program was also used for predicting genome synteny using inter-proteome sequence similarity. ShinyCircos was used for circular visualization of synteny plots (<xref ref-type="bibr" rid="B42">Krzywinski et al., 2009</xref>; <xref ref-type="bibr" rid="B78">Yu et al., 2018</xref>).</p>
</sec>
</sec>
<sec id="S2.SS5">
<title>RsolaniDB Database Development</title>
<p>The RsolaniDB (RDB) database was built to host <italic>R. solani</italic> reference genomes, transcript and protein sequences in FASTA format, along with genome annotations included in GFF3 format. For each genome, the information in the database was structured as entries, in which each entry included a list of details about a given transcript and protein, i.e., intron-exon boundaries; predicted functions; associated pathways and GO terms; predicted sequences; orthologs and functional protein sequence domains predicted from InterPro, PrositeProfile and Pfam. The identifier format for each entry (i.e., RDB ID) starts with &#x201C;RS_&#x201D; and AG subgroup name followed by a unique number. We also included five previously published <italic>R. solani</italic> annotated genome sequences (i.e., AG1-IA, AG1-IB, AG2-2IIIB, AG3-PT and AG8) with their gene identifiers converted into the RDB ID format. The database was written using DHTML and CGI-BIN Perl and MySQL language, to allow users to perform lists of tasks, including a text-based search for the entire database; or in an AG-specific manner. We also included a list of tools to assist users in performing a number of down-stream analyses, including RDB ID to protein/transcript sequence conversion; FASTA sequence-based BLAST search on the entire database or in an AG-specific manner; a tool to retrieve orthologs for a given set of RDB IDs along with tools for functional enrichment analysis. The GO-based functional enrichment tool for gene set analysis of given RDB IDs was built using the topGO R package (<xref ref-type="bibr" rid="B1">Alexa and Rahnenf&#x00FC;hrer, 2009</xref>). Whereas the pathway-based gene set analysis was developed to predict significantly enriched PANTHER pathway IDs for a given set of RDB IDs.</p>
</sec>
</sec>
<sec id="S3" sec-type="results">
<title>Results</title>
<sec id="S3.SS1">
<title>Genome-Wide Comparative Analysis of <italic>Rhizoctonia solani</italic> Assemblies and Its Annotation</title>
<p>We performed high-depth sequencing, <italic>de novo</italic> genome assembly and annotation of 12 <italic>R. solani</italic> isolates. For qualitative evaluation of these assemblies, we used genome sequences of a basidiomycetous mycorrhizal fungus <italic>Tulasnella calospora</italic> (Joint Genome Institute fungal genome portal MycoCosm)<sup><xref ref-type="fn" rid="footnote1">1</xref></sup> and <italic>R. solani</italic> AG3-PT as negative and positive controls, respectively. Overall, the draft genome assemblies of the <italic>R. solani</italic> isolates showed remarkable differences in genome size, ranging anywhere from the smaller AG1-IC (&#x223C;33 Mbp) to the larger AG3-1A1 (&#x223C;71 Mbp) isolate genomes (<xref ref-type="supplementary-material" rid="DS1">Supplementary Table 3</xref>). The number of contigs generated were also highly variable ranging from 678 to 11,793, in which the newly reported assemblies of AG1-IC and AG3-T5 had the highest N50 lengths of 100,597 bp and 196,133 bp, respectively (<xref ref-type="supplementary-material" rid="DS1">Supplementary Table 3</xref>). The heterogeneity in genomic reads was predicted by analyzing the distribution of different <italic>k-mers</italic> in <italic>R. solani</italic> genomic sequencing reads. The analysis revealed a shoulder peak along with the major peak in <italic>k</italic>-mer frequencies for AG2-2IIIB, AG3-1A1, AG3-1AP and AG8, indicating the possible heterogeneity of these genomic reads of these isolates (<xref ref-type="supplementary-material" rid="DS1">Supplementary Figure 1</xref>). The G+C content ranged from 47.47 to 49.07%, with a mean of 48.43% (<xref ref-type="supplementary-material" rid="DS1">Supplementary Table 3</xref>). The quality of these draft genomes was evaluated using BUSCO with scores ranging between &#x223C;88 and 96% (<xref ref-type="supplementary-material" rid="DS1">Supplementary Table 3</xref>), indicating the completeness of essential fungal genes in the predicted assemblies. Among the presented draft genome sequences, a large number of syntenic relationships (<xref ref-type="fig" rid="F1">Figure 1A</xref>) were identified (length &#x003E; 40,000 bp), wherein all the given isolates shared at least four highly similar syntenic regions, except <italic>T. calospora</italic> (outgroup), which did not share any syntenic regions with <italic>R. solani</italic> isolates for the given threshold of &#x003E; 40,000 bp (<xref ref-type="fig" rid="F1">Figure 1B</xref>). The isolates from AG5, AG2-2IIIB and AG3-1A1 shared comparatively lower syntenic regions, whereas AG3-PT (positive control) shared the highest number of syntenic regions with other <italic>R. solani</italic> isolates. In fact, most of the closely related AGs shared a large number of syntenic relationships, e.g., high similarity among AG3 sub-groups. Overall, the analysis exhibited the first line of evidence that indicates widespread collinearity and regions of large similarity across genetically distinct isolates, with <italic>T. calospora</italic> as an outlier.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption><p><bold>(A)</bold> Circos plot. The Circos plot represents the syntenic relationship between genomes of different AGs of <italic>Rhizoctonia solani</italic> K&#x00FC;hn. Each line represents the region of genomic similarity predicted with Synima. Only the regions with coverage &#x003E; 40,000 bases were enumerated and shown. <bold>(B)</bold> The plot highlights the number of high-similarity syntenic regions (coverage &#x003E; 40,000 bp) shared between each pair of genomes, including <italic>T. calospora</italic>. The red connection represents corresponding isolates sharing a comparatively large number of syntenic relationships relative to other pairs of isolates. Here, self-hits were removed or not shown. <bold>(C)</bold> ITS2 phylogeny. ITS2 sequences of the tester strain were obtained from the NCBI database and were clustered with ITS2 sequences from assembled <italic>R. solani</italic> genomes (highlighted with blue color and &#x002A;), along with ITS2 sequences from previously published <italic>R. solani</italic> genome assemblies (marked with &#x002A;&#x002A;). The phylogenetic tree was constructed using megax software with 10,000 bootstrapping steps (see section &#x201C;Materials and Methods&#x201D;), after which the resulting tree and corresponding alignment were visualized together using Phylogeny.IO.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmicb-13-839524-g001.tif"/>
</fig>
<p>Subsequently, we performed the ITS2-based phylogeny to compare the ITS2 sequences of the 12 newly sequenced <italic>R. solani</italic> isolates with that of the known <italic>R. solani</italic> tester strains (as positive controls) and <italic>T. calospora</italic> as an outgroup (<xref ref-type="fig" rid="F1">Figure 1C</xref>). We were not able to predict ITS sequences for AG3-PT. Phylogenetic clusters of AGs reflected strong similarity in ITS2 sequences of assembled genomes with that of tester strains of <italic>R. solani</italic>. For instance, the AG1-IA cluster includes four strains, all belonging to the same AG, i.e., AG1-IA. Similarly, ITS2 sequences of different AG3 and AG4 subgroups were clustered within their respective clades, whereas the outgroup <italic>T. calospora</italic> showed distinct architecture, providing strong evidence for correct methods being used here for genome assemblies. Intriguingly, ITS2 sequences of the AG8 subgroup showed remarkable differences, where sequence of the tester strain (i.e., AG-8-A68), previously published genome sequence (i.e., AG8-01) and the genome reported here (i.e., AG8-Rh89/T) were clustered across different clades of the phylogenetic tree.</p>
</sec>
<sec id="S3.SS2">
<title>Comparison With Other <italic>Rhizoctonia solani</italic> Assemblies</title>
<p>To evaluate the reliability of the genome assemblies, we compared our draft genomes with previously published assemblies of <italic>R. solani</italic> isolates, i.e., AG1-IA, AG1-IB, AG2-2IIIB, and AG8 (<xref ref-type="supplementary-material" rid="DS1">Supplementary Figure 2</xref>; <xref ref-type="bibr" rid="B20">Cubeta et al., 2014</xref>; <xref ref-type="bibr" rid="B32">Hane et al., 2014</xref>; <xref ref-type="bibr" rid="B74">Wibberg et al., 2015a</xref>,<xref ref-type="bibr" rid="B72">2016b</xref>,<xref ref-type="bibr" rid="B73">2017</xref>; <xref ref-type="bibr" rid="B57">Nadarajah et al., 2017</xref>; <xref ref-type="bibr" rid="B26">Ghosh et al., 2019</xref>; <xref ref-type="bibr" rid="B46">Lee et al., 2021</xref>). The mummer plot (<xref ref-type="bibr" rid="B53">Mar&#x00E7;ais et al., 2018</xref>) comparison showed the overall co-linearity and high similarity among similar assemblies, wherein AG8 assemblies were least co-linear, possibly due to the heterokaryotic nature of the AG8 genome (<xref ref-type="bibr" rid="B20">Cubeta et al., 2014</xref>; <xref ref-type="bibr" rid="B32">Hane et al., 2014</xref>). In addition to the above representative assemblies, we found several whole genome assemblies of different AG1 subgroups isolates (<xref ref-type="bibr" rid="B57">Nadarajah et al., 2017</xref>; <xref ref-type="bibr" rid="B26">Ghosh et al., 2019</xref>; <xref ref-type="bibr" rid="B46">Lee et al., 2021</xref>). Among these isolates, we selected two representative assemblies, i.e., AG1-IA-XN.2 (96 scaffolds; NCBI accession: <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="GCA_015342405.1">GCA_015342405.1</ext-link>) and AG1-IA-RhiXN.1 (16 chromosomes; NCBI accession: <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="GCA_016906535.1">GCA_016906535.1</ext-link>), for comparison with our AG1-IA assembly (<xref ref-type="supplementary-material" rid="DS1">Supplementary Figure 3</xref>). Wherein, the selection of AG1-IA assemblies for comparative analysis is based on the large N50 and genome length of these previously published assemblies. The comparative analysis reveals that, despite the sparse scaffolding of AG1-IA, all the AG1 subgroups shares a large number of syntenic relationships (<xref ref-type="supplementary-material" rid="DS1">Supplementary Figures 3A,B</xref>). To gain insight into functional domains of these assemblies, we predicted and compare the InterPro domains of all the AG1 isolates under comparison (<xref ref-type="supplementary-material" rid="DS1">Supplementary Figure 3C</xref>). Interestingly, all the isolates share a significantly large proportion of functional domains, in which AG1-IA shares more than 70% of the domains with at least one of the three other assemblies. Wherein, all the AG1 assemblies possess WD40 repeats domain with a highest proportion (&#x223C;9&#x2013;10%) as compared to the other Interpro domains (<xref ref-type="supplementary-material" rid="TS1">Supplementary File 1</xref>). Along with a large number of conserved domains, a small percentage of unique functional domains among these assemblies reflects the potential host-specific or isolate-specific functional regions of these assemblies. As expected, the proteomes of these AG1 isolates also shares a large number of orthologous protein clusters (<xref ref-type="supplementary-material" rid="DS1">Supplementary Figure 3D</xref>), including AG1-IA proteome, which indicates the comparable functional profiles of these assemblies, motivating us to include AG1-IA for further comparative analysis with other sub-groups sequenced in this study.</p>
</sec>
<sec id="S3.SS3">
<title>Genome-Wide Orthologous Protein Clustering and Functional Analysis</title>
<p>Intron/exon and transcript boundaries were identified using the maker pipeline (see section &#x201C;Materials and Methods&#x201D;), which predicted 7,394&#x2013;10,958 protein coding transcripts per genome (excluding <italic>T. calospora</italic>, <xref ref-type="supplementary-material" rid="DS1">Supplementary Figure 4</xref>) in which the AG3-1A1 genome had the highest number of transcripts. Next, using OrthoMCL, the translated protein sequences in all genomes were clustered into orthologous groups, where each cluster of proteins represented a set of similar sequences likely to represent a protein family. The similarities among the given isolates were enumerated by measuring proteins shared by different proteomes in the same orthoMCL clusters (<xref ref-type="fig" rid="F2">Figure 2A</xref>). As expected, this analysis clearly outgrouped <italic>T. calospora</italic>, indicating that it has a different protein family composition than <italic>R. solani</italic> isolates. The AG1 and AG4 subgroups, AG3-1A1 and AG3-1AP, showed expected similarities and shared similar clustering profiles while AG3-PT and AG5 showed a divergent profile of protein families with respect to the other AGs studied. A large set of orthoMCL clusters shared proteins from all/most of the <italic>R. solani</italic> isolates which further indicates inherent similarities as well as unique attributes across these pathologically diverse groups of fungi. For instance, more than 1,400 orthoMCL clusters were composed of proteins belonging to only two AGs, whereas &#x003E; 1,500 clusters were composed of proteins from all 13 <italic>R. solani</italic> isolates (including previously reported AG3-PT) and <italic>T. calospora</italic> (<xref ref-type="fig" rid="F2">Figure 2B</xref>). It is expected that these conserved clusters are composed of proteins from core gene families with essential functions, whereas other clusters may contain proteins with unique AG-specific roles (<xref ref-type="fig" rid="F2">Figure 2C</xref>). The analysis revealed that AG1-IC, AG2-2IIIB, AG5, AG6-10EEA and AG8 were composed of a large number of unique proteins (&#x003E;1,000 proteins), whereas AG3-1A1 had the highest number of core and auxiliary proteins. The pair-wise comparison of the number of clusters shared by any two AGs highlighted that AG3-1AP shares the highest number of orthoMCL clusters with AG3-1A1, a sector derived hypo-virulent isolate of AG3-1AP (<xref ref-type="fig" rid="F2">Figure 2D</xref>; <xref ref-type="bibr" rid="B44">Lakshman et al., 1998</xref>). In fact, AG3-1A1 proteins shared a large number of clusters with other AG subgroups too, including AG1-IC, AG6-10EEA, AG2-2IIIB and AG4-R118.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption><p>OrthoMCL clustering of the predicted proteomes in <italic>R. solani</italic> AGs. <bold>(A)</bold> Heatmap showing protein conservation across all sequenced <italic>R. solani</italic> AGs and <italic>T. calospora</italic>. Each row represents one orthoMCL cluster, and color is proportional to the number of protein members shared within a given cluster from the given species (black: no member protein present; red: large number of protein members present). The hierarchical clustering (hclust; method: complete) analysis enumerates the similarities between different fungal isolates based on proteins shared by them across all orthoMCL clusters. <bold>(B)</bold> Cluster frequency. The line plot represents the number of orthoMCL clusters shared by different fungal isolates used in this study. Example, &#x003E; 1,400 orthoMCL clusters are shared by 14 different fungal isolates (including positive and negative controls) used in this study. The bimodal nature of the plot represents high similarities across independent proteomes as large numbers of clusters share protein members from 13 fungal isolates. The red line represents the smoothed curves after averaging out the number of clusters. <bold>(C)</bold> Protein classification based on the orthoMCL clusters. The &#x201C;core&#x201D; proteins represent the sub-set of proteomes (from each <italic>R. solani</italic> AG and <italic>T. calospsora</italic>) with a conserved profile across all the isolates. Similarly, the &#x201C;unique&#x201D; sets represent the isolate-specific protein subset. The rest of the protein subsets make up the &#x201C;Auxiliary&#x201D; proteome which are conserved in a limited number of isolates. <bold>(D)</bold> Shared orthoMCL clusters. The number of orthoMCL clusters shared between any two isolates. A shared cluster means, a given orthoMCL cluster contains proteins from both the isolates.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmicb-13-839524-g002.tif"/>
</fig>
<p>To investigate the functional composition of proteins using orthologous groups, we performed InterPro domain family analysis of proteomes from each AG (<xref ref-type="supplementary-material" rid="DS1">Supplementary Figure 5</xref>). The core proteome of most AGs was composed of &#x223C;2,000 InterPro domain families, whereas the unique proteome per AG ranged between 101 (for AG3-PT) to 628 (for AG3-1A1) domain families. The most common protein family in the unique proteome of <italic>R. solani</italic> subgroups was &#x201C;Cytochrome P450,&#x201D; which is essential for fungal adaptations to diverse ecological niches (<xref ref-type="bibr" rid="B19">&#x010C;re&#x0161;nar and Petri&#x010D;, 2011</xref>; <xref ref-type="fig" rid="F3">Figure 3</xref>). Proteins with WD40 repeats were found to be the most common in the unique proteome in most AGs. A few of the AG subgroups were found to be enriched with a protein family that was significantly associated with its unique proteome only, possibly being involved in the survival of that AG in respective hosts. For instance, the AG1-IB unique proteome was enriched with &#x201C;NADH: Flavin Oxidoreductase/NADH oxidase (N-terminal),&#x201D; similarly AG3-1A1 was enriched with &#x201C;ABC transporter-like&#x201D; and &#x201C;Aminoacyl-tRNA synthetase (class-II)&#x201D; InterPro domains. Likewise, AG3-PT was found to be uniquely enriched with &#x201C;Ribosomal protein S4/S9&#x201D; and AG3-1A1 was uniquely enriched with &#x201C;Multicopper oxidase (Type 2)&#x201D; and &#x201C;Patatin like phospholipase domain.&#x201D;</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption><p>InterPro domain analysis of the unique proteome. In the unique proteome of each fungal isolate, InterPro protein domain families were predicted using InterProScan (Version 5.45&#x2013;80.0). Only the top five most enriched protein families are shown. The number marks the corresponding annotation of InterPro family domain in the circular bar plot.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmicb-13-839524-g003.tif"/>
</fig>
</sec>
<sec id="S3.SS4">
<title>A Large Proportion of Protein Clusters Are Uniquely Enriched in <italic>Rhizoctonia solani</italic> Proteomes</title>
<p>The unique components of the 12 proteomes associated with this study and their attributes were compared to the six previously reported <italic>R. solani</italic> spp. (i.e., AG1-IA, AG1-IB, AG3-PT, AG3-Rhs1AP, AG3-2IIIB and AG8). The 18 proteomes with a total number of 180,491 protein sequences (including 6 previously reported <italic>R. solani</italic> spp.) were clustered using CD-HIT (similarity threshold = 65%). CD-HIT enumerated 60,441 protein clusters, of which 46,804 clusters (77.43%) included at least one of the protein sequences from the previously reported <italic>R. solani</italic> proteome. Whereas 22.56% of the clusters (i.e., 13,637 non-identical CD-HIT clusters) were only associated with one or more of the 12 <italic>R. solani</italic> isolates reported in this study. The analysis suggests 15.6% (<italic>n</italic> = 18,542 protein sequences) of the total sequences (i.e., <italic>n</italic> = 118,812 from 12 <italic>R. solani</italic> isolates) generated in this study were sequentially non-identical to previously published proteomes, possibly providing novel sequences and functional information for hypothesis development. Therefore, we investigated the Interpro domains predicted in the protein sequences of 13,637 non-identical CD-HIT clusters which elucidated 3,931 unique Interpro domain IDs, among which most enriched protein domains belonged to the WD40 repeat family, protein kinase domain, F-box domain and Zn(2)-C6 fungal type DNA binding domain. Overall, among the 3,931 Interpro domains, 128 domains were not reported in any of the six previously published genomes/proteomes and were exclusively associated with the 12 <italic>R. solani</italic> isolates reported here. The complete list of non-identical CD-HIT clusters along with their protein components, enriched Interpro domains (128 unique and complete list of 3,931 Interpro domain IDs) are available in <xref ref-type="supplementary-material" rid="TS2">Supplementary File 2</xref>.</p>
</sec>
<sec id="S3.SS5">
<title>Predicted Secretome and Effector Proteins</title>
<p>To facilitate host colonization, plant pathogens secrete proteins to host compartments to establish fungal infection (<xref ref-type="bibr" rid="B41">Kim et al., 2016</xref>; <xref ref-type="bibr" rid="B55">McCotter et al., 2016</xref>; <xref ref-type="bibr" rid="B48">Li et al., 2019</xref>). Therefore, we identified the comprehensive set of secreted proteins from the 12 <italic>R. solani</italic> genomes and the <italic>T. calospora</italic> genome. <xref ref-type="fig" rid="F4">Figure 4A</xref> shows the number of secreted proteins identified in each of the genomes, where AG1-IC, AG3-1A1, AG6-10EEA and, AG2-2IIIB contained a large number of proteins in the predicted secretome (<xref ref-type="supplementary-material" rid="TS3">Supplementary File 3</xref>,<xref ref-type="supplementary-material" rid="DS1">Sheets 1</xref>,<xref ref-type="supplementary-material" rid="DS1">2</xref>). Isolates from AG1-IC, AG2-2IIIB and AG8 contained a comparatively larger number of isolate-specific secreted proteins (i.e., secreted proteins in the unique proteome), while isolates from AG3-1AP, AG3-1A1 and AG3-PT contained a comparatively lower number of secreted proteins. Interestingly, InterPro domain analysis of the secreted proteins suggested that the most enriched protein domain in the predicted secretome was &#x201C;cellulose binding domain&#x2014;fungal&#x201D; (<xref ref-type="fig" rid="F4">Figure 4B</xref>) which is essential for degradation of cellulose and xylans (<xref ref-type="bibr" rid="B49">Linder et al., 1995</xref>). In addition, the secretomes were also enriched with proteins containing &#x201C;Glycoside Hydrolase Family 61,&#x201D; &#x201C;Pectate Lyase&#x201D; and &#x201C;multi-copper oxidase family&#x201D; domains. Most of these protein components function in degradation of the plant host cell wall and breaking down the first line of host defense. We observed that certain families of protein domains were enriched within a few AGs only. For instance, &#x201C;aspartic peptidase family A1&#x201D; domain containing proteins, involved in diverse fungal metabolic processes, were mainly enriched in the AG2-2IIIB isolate, similarly the &#x201C;lysine-specific metallo-endopeptidase&#x201D; domain was enriched in AG3-1AP, AG5 and AG8. The AG4-R118 secretome was significantly enriched with proteins belonging to &#x201C;Glycoside Hydrolase Family 28&#x201D; and &#x201C;Peptidase S8 propeptide-proteinase inhibitor I9&#x201D; domains, whereas the AG4-RS23 secretome was composed of &#x201C;NodB homology&#x201D; and &#x201C;alpha/beta hydrolase fold-1&#x201D; domains. Taken together, the analysis indicated that each of the given AG secretomes was significantly enriched with a unique set of protein families that possibly allows a variety of biological functions in different host systems.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption><p>The secreted proteins. <bold>(A)</bold> Number of predicted proteins in the secretome of each fungal isolate (highlighted in yellow). The secreted proteins predicted in the unique proteome of each isolate is highlighted in red. <bold>(B)</bold> Comparative analysis of the top six highly enriched InterPro domains in the secretome. <bold>(C)</bold> Comparative analysis of the total number of secreted proteins predicted in <italic>R. solani</italic> isolates as compared to other basidiomycetes used in this study. <italic>P</italic>-value is computed using the unpaired Wilcoxon-rank sum test. <bold>(D)</bold> Heatmap showing the pairwise comparison of the InterPro terms commonly shared by the secretome of <italic>R. solani</italic> isolates as well as other basidiomycetes. The strong hierarchical clustering of R. solani isolates highlights their functionally unique and distinct secretome profile as compared to other basidiomycetes.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmicb-13-839524-g004.tif"/>
</fig>
<p>To further identify unique and conserved attributes associated with all 13 <italic>R. solani</italic> isolates (including previously published genomic information from the AG3-PT isolate, as positive control), we performed a comparative analysis of their secretomes with the secretomes of 14 other fungi (excluding <italic>T. calospora</italic>), which represented the major taxonomic, pathogenic, ecological, and commercially important (edible fungi) groups within the Division Basidiomycota (<xref ref-type="supplementary-material" rid="DS1">Supplementary Table 4</xref>). We hypothesized that a small set of functionally important proteins, e.g., secreted proteins, in <italic>R. solani</italic> may have unique attributes not observed within the other Basidiomycetes. The number of secreted proteins predicted in <italic>R. solani</italic> AGs were not significantly different with the number of secreted proteins in other Basidiomycetes (<italic>p</italic> = 0.0629; <xref ref-type="fig" rid="F4">Figure 4C</xref>). However, the InterPro domains enriched in the secretome of <italic>R. solani</italic> AGs and other Basidiomycetes were found to be significantly different. Only a limited number of InterPro terms were shared between <italic>R. solani</italic> AGs and other Basidiomycetes, and <italic>R. solani</italic> AGs were functionally closer to each other than to the other Basidiomycetes (<xref ref-type="fig" rid="F4">Figure 4D</xref>), suggesting that <italic>R. solani</italic> secretomes have a unique domain profile. Overall, 565 InterPro terms were found in the secretome of <italic>R. solani</italic>, whereas the other Basidiomycete (including <italic>T. calospora</italic>), secretomes were enriched with 620 terms where 283 InterPro terms were common across both groups of species. There were 282 InterPro terms (50%) uniquely associated with <italic>R. solani</italic>, not observed in the secretome of other Basidiomycetes, and 337 InterPro terms only observed in the secretome of other Basidiomycetes. The <italic>R. solani</italic>-specific 282 InterPro terms included several protein domains belonging to diverse functional groups, e.g., &#x201C;Aspartic peptidase A1 family,&#x201D; &#x201C;Cysteine rich secretory protein related&#x201D; and &#x201C;Polyscaccaride lyase 8&#x201D; domains. Among the domains commonly enriched across both <italic>R. solani</italic> isolates and other Basidiomycetes, we calculated the fold change of difference of domain occurrence in their secretome and enumerated the protein domains with significant differences in <italic>R. solani</italic> as compared to the other Basidiomycetes (<xref ref-type="supplementary-material" rid="TS3">Supplementary File 3</xref>,<xref ref-type="supplementary-material" rid="DS1"> Sheets 1</xref>,<xref ref-type="supplementary-material" rid="DS1">2</xref>). The analysis suggested that proteins with domains like &#x201C;Pectate lyase,&#x201D; &#x201C;Serine amino-peptidase&#x201D; and &#x201C;Lysine-specific metallo-endopeptidase&#x201D; were significantly enriched in <italic>R. solani</italic> secretomes. Similarly, proteins with &#x201C;Hydrophobin&#x201D; and &#x201C;Zinc finger ring-type&#x201D; domains were enriched in the other Basidiomycetes. We believe that the large number of unique functional domains in the secreted proteome of <italic>R. solani</italic> may be functionally relevant, allowing these fungi to survive under diverse conditions, and should be investigated to understand their role in survival.</p>
<p>Although these plant pathogenic fungi secrete a large number of proteins, only a small proportion have been implicated in fungal-plant disease interactions, i.e., effector proteins (<xref ref-type="bibr" rid="B41">Kim et al., 2016</xref>; <xref ref-type="bibr" rid="B55">McCotter et al., 2016</xref>; <xref ref-type="bibr" rid="B48">Li et al., 2019</xref>). Effector proteins can strongly inhibit the activity of host cellular proteases and allow pathogenic fungi to evade host defense mechanisms. Fungal effector proteins are not known for having a conserved family of domains, these proteins typically being of small length (300&#x2013;400 amino acids) and higher cysteine content (<xref ref-type="bibr" rid="B67">Stergiopoulos and de Wit, 2009</xref>; <xref ref-type="bibr" rid="B55">McCotter et al., 2016</xref>; <xref ref-type="bibr" rid="B66">Sperschneider et al., 2016</xref>). Our analysis revealed 75&#x2013;134 predicted effector proteins in <italic>R. solani</italic> genomes, whereas <italic>T. calospora</italic> contained 136 effector proteins (<xref ref-type="fig" rid="F5">Figure 5A</xref>).</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption><p>Effector proteins. <bold>(A)</bold> The number of cysteine rich effector proteins predicted in the predicted secretome of each fungal isolate. <bold>(B)</bold> The proportion of cysteine observed across all the effectors predicted in each isolate. <bold>(C)</bold> Topmost enriched InterPro domains in effector proteins of <italic>Rhizoctonia</italic> species (not <italic>T. calospora</italic>) and other Basidiomycetes (including <italic>T. calospora</italic>). <bold>(D)</bold> The comparative analysis of the distribution of number of effector proteins predicted in <italic>R. solani</italic> AGs as compared to other Basidiomycetes. The <italic>p</italic>-value is computed using the unpaired Wilcoxon-rank sum test.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmicb-13-839524-g005.tif"/>
</fig>
<p>Isolates from AG1-IC contained the highest number of effector proteins (<italic>n</italic> = 134), whereas the isolate from AG3-PT contained a small number of effectors (<italic>n</italic> = 75). On average, isolates contained approximately 100 effector proteins which had a similar proportion of cysteine residues (<xref ref-type="fig" rid="F5">Figure 5B</xref>). The topmost enriched domain among all <italic>R. solani</italic> effector proteins was &#x201C;Pectate lyase&#x201D; followed by &#x201C;thaumatin family&#x201D; of domain containing proteins (<xref ref-type="fig" rid="F5">Figure 5C</xref>; <xref ref-type="supplementary-material" rid="TS3">Supplementary File 3</xref>,<xref ref-type="supplementary-material" rid="DS1">Sheet 3</xref>).</p>
<p>The other Basidiomycetes studied were enriched with a similar number of effector proteins (<italic>p</italic> = 0.14; <xref ref-type="fig" rid="F5">Figures 5C,D</xref>). Effector proteins in <italic>R solani</italic> AGs included proteins belonging to 237 InterPro terms, whereas effector proteins from the other Basidiomycetes (including <italic>T. calospora</italic>) included proteins enriched with 119 terms. We found 173 terms (72%) that were uniquely associated with <italic>R. solani</italic> AGs, in which most abundant terms include IPR001283 (Cystine-rich-secretory-protein related) (<xref ref-type="supplementary-material" rid="TS3">Supplementary File 3</xref>, <xref ref-type="supplementary-material" rid="DS1">Sheet 4</xref>). These unique effectors may play the deciding roles in host recognition and virulence of <italic>Rhizoctonia</italic> pathogens (<xref ref-type="bibr" rid="B76">Yamamoto et al., 2019</xref>; <xref ref-type="bibr" rid="B70">Wei et al., 2020</xref>). Also, 64 InterPro terms were commonly enriched in both groups of effector proteins, wherein &#x201C;Pectate lyase&#x201D; and &#x201C;Glycoside hydrolase family 28&#x201D; were mainly associated with <italic>R. solani</italic> AG subgroups and &#x201C;Hydrophobin&#x201D; was mainly associated with other Basidiomycetes. The complete list of secretome, effector proteins, InterPro domains and associated information are available in <xref ref-type="supplementary-material" rid="TS3">Supplementary File 3</xref>. The complete list includes those predicted secretome and effector proteins, that are already known to be associated with the <italic>Rhizoctonia</italic> secretome (e.g., Ricin domain) but not highlighted above.</p>
</sec>
<sec id="S3.SS6">
<title>Carbohydrate-Active Enzymes</title>
<p>CAZymes are essential for degradation of host plant cells and fungal colonization in the host (<xref ref-type="bibr" rid="B39">Kameshwar et al., 2019</xref>; <xref ref-type="bibr" rid="B8">Barrett et al., 2020</xref>). Using CAZy (Carbohydrate Active Enzyme database) (<xref ref-type="bibr" rid="B50">Lombard et al., 2014</xref>), which contains classified information regarding enzymes involved in complex carbohydrate metabolism, we annotated and compared the distribution of CAZymes in all <italic>R. solani</italic> isolates. Overall, <italic>R. solani</italic> isolates were composed of 383&#x2013;595 high confidence CAZymes, with AG3-1A1 having the largest number of CAZymes (<xref ref-type="fig" rid="F6">Figure 6A</xref>). These predicted CAZymes in <italic>R. solani</italic> AGs were mainly distributed across 177 CAZyme families that can be broadly classified into six major classes of enzymes, i.e., Glycoside Hydrolase (GH), Polysaccharide Lyase (PL), Carbohydrate Esterase (CE), Carbohydrate-binding modules (CBM) and redox enzymes with Auxiliary Activities (AA). Our analysis revealed that GH forms the major class of CAZymes in all fungal species, including <italic>T. calospora</italic> (<xref ref-type="supplementary-material" rid="DS1">Supplementary Figures 6</xref>, <xref ref-type="supplementary-material" rid="DS1">7</xref>); this enzyme hydrolyzing glycosidic linkages between carbohydrate and non-carbohydrate moieties or two or more carbohydrate moieties (<xref ref-type="bibr" rid="B33">Henrissat, 1991</xref>). Whereas CBM forms the least abundant class of enzymes enriched in the proteomes of the given isolates. Despite the differences, we observed a similar distribution of the enzyme count in each class of CAZyme across all given isolates.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption><p>CAZymes<bold>. (A)</bold> The number of carbohydrate-metabolizing enzymes (CAZymes) predicted in the proteome of each fungal isolate. <bold>(B)</bold> Heatmap showing the CAZyme conservation across all the <italic>R. solani</italic> AGs and <italic>T. calospora</italic>. Each row represents one CAZyme family of proteins, and color is proportional to the number of protein members shared within a given family from the given species (black: no member protein present; red: large number of protein members present). The hierarchical clustering (hclust; method: complete) enumerates the similarities between different fungal isolates based on proteins shared by them across all CAZyme families. For simplicity only the CAZyme families enriched in more than 50 enzymes across all proteomes are shown.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmicb-13-839524-g006.tif"/>
</fig>
<p>Among the predicted 177 families, only 34 families were abundant (with total enzyme count &#x003E; 50 proteins; <xref ref-type="fig" rid="F6">Figure 6B</xref>) across all the given isolates, i.e., <italic>Rhizoctonia</italic> species and <italic>T. calospora</italic>. These 34 families had a distinct abundance profile in each AG, for instance, proteins from the GH7 family was highly abundant in <italic>T. calospora</italic> as compared to the <italic>R. solani</italic> isolates. Similarly, proteins belonging to PL1_4 were not observed in AG4-R118 and <italic>T. calospora</italic>. We divided these 34 families into three different groups, with respect to their abundance profile in <italic>R. solani</italic> isolates. Group-1 contained CAZymes belonging to GH28, AA9, PL3_2 and AA3_2 families and formed the highly abundant families (total enzyme count &#x003E; 200 proteins) of enzymes in <italic>R. solani</italic> AGs. Similarly, Group-2 contained 11 CAZyme families with enzymes moderately abundant in <italic>R. solani</italic> AGs. Whereas Group-3 contained 19 families with sparsely abundant CAZymes. In all three clusters, AG3-1A1 contained the highest number of CAZymes for most of the 34 families and was significantly enriched with all members of Group-1 families. In fact, the clustering analysis highlighted the similar profiles of AG3-1A1 and AG2-2IIIB, mainly due to a similar distribution of proteins belonging to GH28, AA9, AA3_2 and GH7. In Group-1, although GH28 containing enzymes were abundant in most of the <italic>R. solani</italic> isolates, AG8 contained a limited number of enzymes belonging to this family. Similarly, AA9 and PL3_2 families of enzymes were abundant only in 50% of the isolates and may provide a unique set of functions to the respective isolates. In Group-2 there was a similar distribution of abundance profiles across all isolates, except <italic>T. calospora</italic>, which indicated their probable role in <italic>R. solani</italic> specific functions. For example, CAZymes belonging to AA5_1, GH18 and PL4_1 were enriched in most of the <italic>R. solani</italic> isolates, but not in <italic>T. calospora</italic>. The conserved distribution of CAZyme families in the diverse proteomes of different <italic>R. solani</italic> isolates signified their essential role in fungal activity. Group-3 CAZymes provided unique and distinct profiles to each AG with a limited number of families showing a similar abundance profile. Wherein, <italic>T. calospora</italic> was found to be distinctly abundant in CAZymes belonging to GH5_5, not observed with <italic>R. solani</italic> isolates. These results strongly suggested that <italic>R. solani</italic> isolates share a large proportion of carbohydrate degrading enzymes, in which an isolate-specific CAZyme profile can also be observed (mainly from Group-3). To confirm if the abundance profile was strictly associated with <italic>R. solani</italic> isolates, we performed the comparative analysis with the abundance profile from the 14 other Basidiomycetes. The analysis clearly revealed a distinct CAZyme profile from other Basidiomycetes, in which <italic>R. solani</italic> isolates were phylogenetically grouped into a different cluster (<xref ref-type="supplementary-material" rid="DS1">Supplementary Figure 8</xref>). The analysis highlighted the families that were uniquely abundant in <italic>R. solani</italic> isolates rather than other Basidiomycetes, e.g., GH28, PL3_2, AA5_1, CE4, GH10, GH62, PL4_1, CE8, PL1_7, PL1_4 and AA7, and as expected, most families belonged to Group-1 and Group-2 of the previous analysis. Among these families, PL3_2, GH62 and CE8 were distinctly expressed in <italic>R. solani</italic> isolates.</p>
</sec>
<sec id="S3.SS7">
<title>RsolaniDB: A <italic>Rhizoctonia solani</italic> Pangenome Database and Its Applications</title>
<p>RDB is a large-scale, integrative repository for hosting the <italic>R. solani</italic> pangenome project with emphasis on supporting data mining and analysis, wherein the genomes and their components can be accessed under three different categories, viz. genomic, ortholog and functional assignment.</p>
<sec id="S3.SS7.SSS1">
<title>Genomes</title>
<p>The genomic content includes draft genome sequences of <italic>R. solani</italic> isolates in FASTA format along with the gene level annotation in GFF3 format. The annotation includes prediction of gene boundaries with introns and exons, as well as their locations on contigs or scaffolds. It also includes the predicted transcribed cDNA sequences and translated protein sequences. This information is vital for those users looking for reference genomes and their annotated components for mapping RNAseq reads. The draft genomes and their annotation can also be downloaded and used for downstream local analysis, e.g., variants calling, SNP, eQTLs analysis and other similar genomic analyses with different bioinformatics methods.</p>
</sec>
<sec id="S3.SS7.SSS2">
<title>Orthologs</title>
<p>Using the orthoMCL clustering on the proteomes of 18 <italic>R. solani</italic> (including previously published genome assemblies), protein sequences were compared and clustered into groups of similar sequences. The sequences not part of any of the clusters, i.e., singletons, and unique to respective isolates were categorized as &#x201C;unique.&#x201D; Whereas the rest of the proteome was categorized either into &#x201C;core&#x201D; or &#x201C;auxiliary&#x201D; groups of orthoMCL clusters. RDB allows users to retrieve this information for each protein entry and the protein ID of other members of its ortholog cluster family, if any.</p>
</sec>
<sec id="S3.SS7.SSS3">
<title>Functional Assignment</title>
<p>This category includes the predicted InterPro protein domains associated with each of the protein entries. RDB also includes GO information associated with each protein, along with PANTHER pathway terms. This information helps in assigning the functional description for each protein entry in the database.</p>
<p>The database is organized to include one unique RDB ID (or entry) for each gene structure, with all the above associated information. The RDB ID allows users to search the genomic coordinates (intron/exon boundaries) with IGV visualization, sequences and its functional annotation, for each gene in each <italic>R. solani</italic> isolate. This information can be retrieved from the database via the &#x201C;text-based&#x201D; or &#x201C;keywords-based&#x201D; search in an AG-specific manner or from the entire database. Users can also perform blast searches of their own nucleotide or protein sequences to the entire database or can target a given AG. Moreover, users can retrieve the set of sequences in FASTA format, for a given list of RDB IDs. One of the important and unique features of RsolaniDB tools allows users to perform functional or gene-set enrichment analysis of given RDB IDs, e.g., Gene Ontology or pathway analysis. This feature is especially useful for analyzing differentially expressed genes after RNAseq data analysis, as it provides the statistical significance (as <italic>p</italic>-values) of different GO/pathway terms enriched in a given set of differentially expressed genes. As far as we know, this feature is unique to RDB with respect to any other existing <italic>Rhizoctonia</italic> resources. However, it requires the user to use reference genome sequences and the annotation file from RDB database for subjecting into the RNAseq data analysis pipeline. As an additional resource, RDB also incorporated previously published (<xref ref-type="bibr" rid="B20">Cubeta et al., 2014</xref>; <xref ref-type="bibr" rid="B32">Hane et al., 2014</xref>; <xref ref-type="bibr" rid="B71">Wibberg et al., 2016a</xref>; <xref ref-type="bibr" rid="B57">Nadarajah et al., 2017</xref>) genome and transcriptome level information in a single platform with an RDB ID format. The database is publicly available to the scientific community, accessible at <ext-link ext-link-type="uri" xlink:href="http://rsolanidb.kaust.edu.sa/RhDB/index.html">http://rsolanidb.kaust.edu.sa/RhDB/index.html</ext-link>.</p>
</sec>
</sec>
</sec>
<sec id="S4" sec-type="discussion">
<title>Discussion</title>
<p><italic>Rhizoctonia solani</italic> is considered one of the most destructive and diverse groups of soil-borne plant pathogens causing various diseases on a wide range of economically important crops. It is classified into 13 AGs with distinctive pathogenic host ranges and responsiveness to disease control measures. Until now, draft genome assemblies belonging to only four of the 13 AGs had been reported; viz. AG1-IA (<xref ref-type="bibr" rid="B57">Nadarajah et al., 2017</xref>), AG1-IB (<xref ref-type="bibr" rid="B74">Wibberg et al., 2015a</xref>,<xref ref-type="bibr" rid="B75">b</xref>), AG2-2IIIB (<xref ref-type="bibr" rid="B72">Wibberg et al., 2016b</xref>), AG3-Rhs1AP (<xref ref-type="bibr" rid="B20">Cubeta et al., 2014</xref>), AG3-PT isolate Ben-3 (<xref ref-type="bibr" rid="B73">Wibberg et al., 2017</xref>), and AG8 (<xref ref-type="bibr" rid="B32">Hane et al., 2014</xref>). Here we expanded the scope of genetic analysis of the <italic>R. solani</italic> complex by performing comprehensive genome sequencing, assembly, annotation and comparative analysis of 12 <italic>R. solani</italic> isolates. This enabled us to perform pangenome analysis of <italic>R. solani</italic> on 7 AGs (AG1, AG2, AG3, AG4, AG5, AG6, AG8), selected additional sub-groups (AG1-IC, AG3-TB), and a hypovirulent isolate (AG3-1A1). Although the heterokarotic and diploid nature of <italic>Rhizoctonia</italic> species were expected to cause genome assembly challenges (<xref ref-type="bibr" rid="B72">Wibberg et al., 2016b</xref>), we observed a large number of inter-group syntenic regions as well as ITS2-based and protein sequence and domain similarities which highlights the high similarities among the 13 <italic>R. solani</italic> isolates (including AG3-PT) studied. In addition, a large proportion of CD-HIT protein clusters were also found to be conserved in these isolates when compared to the previously reported <italic>R. solani</italic> protein sequences, thus reassuring the data generation, processing pipelines as well as the high quality of the draft genome sequences reported in this study.</p>
<p>To deduce the similarities and unique features of predicted proteomes, we performed a series of comparative analyses that indicated the expected heterogeneity among <italic>R. solani</italic> subgroups with the orchid mycorrhizal fungus <italic>T. calospora</italic> as an outlier. For example, both AG5 and AG2-2IIIB included a large set of unique proteomes as well as secretomes, enriched with InterPro families of proteins that were abundant in these two AGs. Additionally, the proteome of <italic>R. solani</italic> isolates was uniquely and highly enriched with proteins with &#x201C;pectate lyase&#x201D; domains, when compared to other Basidiomycetes. Another finding of potential significance was that the highest number of orthoMCL clusters was shared between AG3-1A1 and AG3-1AP, both isolates belonging to the AG3-PT subgroup. Isolate AG3-1A1 is the sector-derived, hypovirulent isolate of the more virulent isolate, AG3-1AP. Intriguingly, AG3-1A1 has been demonstrated to be a successful biocontrol agent of isolate AG3-1AP in the field (<xref ref-type="bibr" rid="B11">Bernard et al., 2012</xref>). A high degree of overlap in gene function is consistent with competitive niche exclusion as the mechanism of biocontrol. Overall, by using a novel set of genomes, orthoMCL comparative analysis highlighted several unique relationships across the <italic>R. solani</italic> isolates, that may be used by mycologists in disease management strategies.</p>
<p>Secretome analysis revealed several interesting findings that provided unique characteristics to each <italic>R. solani</italic> isolate, e.g., the secretome of AG1-IB and AG3-T5 being uniquely and significantly enriched with three different multi-copper oxidases (type 1/2/3), isolates from both AGs being known to cause foliar diseases. Despite inherent differences, most of the secretomes had similar composition in their significantly enriched protein domains, which mainly included &#x201C;Cellulose-binding domain fungal,&#x201D; &#x201C;Glycoside hydrolase family 61&#x201D; and &#x201C;Pectate lyase.&#x201D; However, the composition was significantly different with respect to other Basidiomycetes and a large number of reported protein families were uniquely associated with multiple <italic>R. solani</italic> isolates. We observed similar findings for the effector proteins, wherein proteins containing &#x201C;Cysteine rich secretory proteins,&#x201D; &#x201C;Pectate lyase&#x201D; and &#x201C;Thaumatin&#x201D; were distinctly abundant in <italic>R. solani</italic> isolates, while &#x201C;Hydrophobin&#x201D; was only abundant in other Basidiomycetes. Similarly, the CAZyme analysis highlighted several unique attributes associated with each <italic>R. solani</italic> species especially AG3-1A1 possessing the CBM1 family of proteins which are linked with degradation of insoluble polysaccharides (<xref ref-type="bibr" rid="B69">Van Bueren et al., 2005</xref>). Several families of CAZymes were not present in <italic>T. calospora</italic>, which is a symbiotic mycorrhizal fungus, and other Basidiomycetes, e.g., GH28, PL3_2, AA5_1 and GH10 (<xref ref-type="bibr" rid="B24">Fochi et al., 2017</xref>). In addition, AG3-1A1 had exceptionally abundant proteins in AA9 and GH28, a feature not observed with any other Basidiomycetes. In contrast, AA3_2 (Group-1) was abundant in most of the Basidiomycetes, including <italic>R. solani</italic>. Overall, data presented in this study were consistent with the hypothesis that AGs and sub-groups of <italic>Rhizoctonia</italic> species are highly heterogeneous, each with unique functional genomic properties, while being conserved in their functional regions with respect to other groups. The unique secretomes, effector and similarly CAZymes profiles of <italic>R. solani</italic> relative to other Basidiomycetes may reflect the ecological and host adaptation strategies and calls for future research to better understand the biology and pathology of this species complex.</p>
<p>Since each of the <italic>R. solani</italic> AGs or subgroups is characterized by a unique heterogeneous profile, we strongly believe that the presented genome assemblies, annotation and comparative analyses available with our web-resource <italic>viz.</italic> RsolaniDB (RDB) will facilitate mycologists and plant pathologists in generating a greater understanding of <italic>R. solani</italic> biology and ecology, and in developing its disease management projects, including drug target discovery and design of future diagnostic tools for its rapid discrimination under indoor and outdoor farming environments.</p>
</sec>
<sec id="S5" sec-type="data-availability">
<title>Data Availability Statement</title>
<p>The processed fastq files and the annotated genome assemblies generated and presented in this study can be found in the online repositories. The name of the repositories and accession numbers can be found below: <ext-link ext-link-type="uri" xlink:href="https://www.ebi.ac.uk/arrayexpress/">https://www.ebi.ac.uk/arrayexpress/</ext-link>, <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="E-MTAB-9588">E-MTAB-9588</ext-link> <ext-link ext-link-type="uri" xlink:href="https://www.ebi.ac.uk/ena">https://www.ebi.ac.uk/ena</ext-link>, <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="PRJEB42614">PRJEB42614</ext-link>.</p>
</sec>
<sec id="S6">
<title>Author Contributions</title>
<p>AK, DL, and AP conceived the study, interpreted the results, and wrote the manuscript. AK performed the bioinformatics analysis and developed the computational pipelines and the database. AR, SM, and MN conducted the molecular experiments, library preparation, and sequencing. DR collected and stored the materials and edited the manuscript. AP and DL supervised the overall project. All authors contributed to the article and approved the submitted version.</p>
</sec>
<sec id="conf1" sec-type="COI-statement">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="pudiscl1" sec-type="disclaimer">
<title>Publisher&#x2019;s Note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
</body>
<back>
<sec id="S7" sec-type="funding-information">
<title>Funding</title>
<p>This project was funded by a USDA-ARS agreement (Agreement #-58-8042-8-067-F) and a KAUST faculty baseline fund (BAS/1/1020-01-01).</p>
</sec>
<ack><p>We thank the members of the Bioscience Core Laboratory (BCL) in KAUST for producing the raw DNA and RNA sequence datasets and Adnan (Ed) Ismaiel, USDA-ARS, SASL, for DNA extraction and fungal culture maintenance. We also thank Drs. Ian Misner and Nadim Alkharouf (Towson University, Towson, MD) for helping during the initial set-up phase of the project. We also thank Arindam Chakraborty and his team members from KAUST for their technical IT support in setting up RsolaniDB database server.</p>
</ack>
<sec id="S9" sec-type="supplementary-material">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fmicb.2022.839524/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fmicb.2022.839524/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Data_Sheet_1.pdf" id="DS1" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table_1.xlsx" id="TS1" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table_2.xlsx" id="TS2" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table_3.xlsx" id="TS3" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Alexa</surname> <given-names>A.</given-names></name> <name><surname>Rahnenf&#x00FC;hrer</surname> <given-names>J.</given-names></name></person-group> (<year>2009</year>). <article-title>Gene set enrichment analysis with topGO.</article-title> <source><italic>Bioconductor Improv</italic></source> <volume>27</volume> <fpage>1</fpage>&#x2013;<lpage>26</lpage>.</citation></ref>
<ref id="B2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Almagro Armenteros</surname> <given-names>J. J.</given-names></name> <name><surname>Tsirigos</surname> <given-names>K. D.</given-names></name> <name><surname>S&#x00F8;nderby</surname> <given-names>C. K.</given-names></name> <name><surname>Petersen</surname> <given-names>T. N.</given-names></name> <name><surname>Winther</surname> <given-names>O.</given-names></name> <name><surname>Brunak</surname> <given-names>S.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>SignalP 5.0 improves signal peptide predictions using deep neural networks.</article-title> <source><italic>Nat. Biotechnol.</italic></source> <volume>37</volume> <fpage>420</fpage>&#x2013;<lpage>423</lpage>. <pub-id pub-id-type="doi">10.1038/s41587-019-0036-z</pub-id> <pub-id pub-id-type="pmid">30778233</pub-id></citation></ref>
<ref id="B3"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Amaradasa</surname> <given-names>B. S.</given-names></name> <name><surname>Horvath</surname> <given-names>B. J.</given-names></name> <name><surname>Lakshman</surname> <given-names>D. K.</given-names></name> <name><surname>Warnke</surname> <given-names>S. E.</given-names></name></person-group> (<year>2013</year>). <article-title>DNA fingerprinting and anastomosis grouping reveal similar genetic diversity in <italic>Rhizoctonia</italic> species infecting turfgrasses in the transition zone of USA.</article-title> <source><italic>Mycologia</italic></source> <volume>105</volume> <fpage>1190</fpage>&#x2013;<lpage>1201</lpage>. <pub-id pub-id-type="doi">10.3852/12-368</pub-id></citation></ref>
<ref id="B4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Anderson</surname> <given-names>J. P.</given-names></name> <name><surname>Hane</surname> <given-names>J. K.</given-names></name> <name><surname>Stoll</surname> <given-names>T.</given-names></name> <name><surname>Pain</surname> <given-names>N.</given-names></name> <name><surname>Hastie</surname> <given-names>M. L.</given-names></name> <name><surname>Kaur</surname> <given-names>P.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>Proteomic analysis of <italic>Rhizoctonia solani</italic> identifies infection-specific, redox associated proteins and insight into adaptation to different plant hosts.</article-title> <source><italic>Mol. Cell. Proteomics</italic></source> <volume>15</volume> <fpage>1188</fpage>&#x2013;<lpage>1203</lpage>. <pub-id pub-id-type="doi">10.1074/mcp.M115.054502</pub-id> <pub-id pub-id-type="pmid">26811357</pub-id></citation></ref>
<ref id="B5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Andrews</surname> <given-names>S.</given-names></name></person-group> (<year>2020</year>). <article-title>Babraham bioinformatics &#x2013; FastQC a quality control tool for high throughput sequence data.</article-title> <source><italic>Soil</italic></source> <volume>5</volume> <fpage>47</fpage>&#x2013;<lpage>81</lpage>. <pub-id pub-id-type="doi">10.1016/0038-0717(73)90093-X</pub-id></citation></ref>
<ref id="B6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ashburner</surname> <given-names>M.</given-names></name> <name><surname>Ball</surname> <given-names>C. A.</given-names></name> <name><surname>Blake</surname> <given-names>J. A.</given-names></name> <name><surname>Botstein</surname> <given-names>D.</given-names></name> <name><surname>Butler</surname> <given-names>H.</given-names></name> <name><surname>Cherry</surname> <given-names>J. M.</given-names></name><etal/></person-group> (<year>2000</year>). <article-title>Gene ontology: tool for the unification of biology.</article-title> <source><italic>Nat. Genet.</italic></source> <volume>25</volume> <fpage>25</fpage>&#x2013;<lpage>29</lpage>. <pub-id pub-id-type="doi">10.1038/75556</pub-id> <pub-id pub-id-type="pmid">10802651</pub-id></citation></ref>
<ref id="B7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bankevich</surname> <given-names>A.</given-names></name> <name><surname>Nurk</surname> <given-names>S.</given-names></name> <name><surname>Antipov</surname> <given-names>D.</given-names></name> <name><surname>Gurevich</surname> <given-names>A. A.</given-names></name> <name><surname>Dvorkin</surname> <given-names>M.</given-names></name> <name><surname>Kulikov</surname> <given-names>A. S.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>SPAdes: a new genome assembly algorithm and its applications to single-cell sequencing.</article-title> <source><italic>J. Comput. Biol.</italic></source> <volume>19</volume> <fpage>455</fpage>&#x2013;<lpage>477</lpage>. <pub-id pub-id-type="doi">10.1089/cmb.2012.0021</pub-id> <pub-id pub-id-type="pmid">22506599</pub-id></citation></ref>
<ref id="B8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Barrett</surname> <given-names>K.</given-names></name> <name><surname>Jensen</surname> <given-names>K.</given-names></name> <name><surname>Meyer</surname> <given-names>A. S.</given-names></name> <name><surname>Frisvad</surname> <given-names>J. C.</given-names></name> <name><surname>Lange</surname> <given-names>L.</given-names></name></person-group> (<year>2020</year>). <article-title>Fungal secretome profile categorization of CAZymes by function and family corresponds to fungal phylogeny and taxonomy: example <italic>Aspergillus</italic> and <italic>Penicillium</italic>.</article-title> <source><italic>Sci. Rep.</italic></source> <volume>10</volume>:<issue>5158</issue>. <pub-id pub-id-type="doi">10.1038/s41598-020-61907-1</pub-id> <pub-id pub-id-type="pmid">32198418</pub-id></citation></ref>
<ref id="B9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bateman</surname> <given-names>A.</given-names></name> <name><surname>Martin</surname> <given-names>M. J.</given-names></name> <name><surname>O&#x2019;Donovan</surname> <given-names>C.</given-names></name> <name><surname>Magrane</surname> <given-names>M.</given-names></name> <name><surname>Alpi</surname> <given-names>E.</given-names></name> <name><surname>Antunes</surname> <given-names>R.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>UniProt: the universal protein knowledgebase.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>45</volume> <fpage>D158</fpage>&#x2013;<lpage>D169</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkw1099</pub-id> <pub-id pub-id-type="pmid">27899622</pub-id></citation></ref>
<ref id="B10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bengtsson-Palme</surname> <given-names>J.</given-names></name> <name><surname>Ryberg</surname> <given-names>M.</given-names></name> <name><surname>Hartmann</surname> <given-names>M.</given-names></name> <name><surname>Branco</surname> <given-names>S.</given-names></name> <name><surname>Wang</surname> <given-names>Z.</given-names></name> <name><surname>Godhe</surname> <given-names>A.</given-names></name><etal/></person-group> (<year>2013</year>). <article-title>Improved software detection and extraction of ITS1 and ITS2 from ribosomal ITS sequences of fungi and other eukaryotes for analysis of environmental sequencing data.</article-title> <source><italic>Methods Ecol. Evol.</italic></source> <volume>4</volume> <fpage>914</fpage>&#x2013;<lpage>919</lpage>. <pub-id pub-id-type="doi">10.1111/2041-210X.12073</pub-id></citation></ref>
<ref id="B11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bernard</surname> <given-names>E.</given-names></name> <name><surname>Larkin</surname> <given-names>R. P.</given-names></name> <name><surname>Tavantzis</surname> <given-names>S.</given-names></name> <name><surname>Erich</surname> <given-names>M. S.</given-names></name> <name><surname>Alyokhin</surname> <given-names>A.</given-names></name> <name><surname>Sewell</surname> <given-names>G.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>Compost, rapeseed rotation, and biocontrol agents significantly impact soil microbial communities in organic and conventional potato production systems.</article-title> <source><italic>Appl. Soil Ecol.</italic></source> <volume>52</volume> <fpage>29</fpage>&#x2013;<lpage>41</lpage>. <pub-id pub-id-type="doi">10.1016/j.apsoil.2011.10.002</pub-id></citation></ref>
<ref id="B12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bills</surname> <given-names>G. F.</given-names></name> <name><surname>Singleton</surname> <given-names>L. L.</given-names></name> <name><surname>Mihail</surname> <given-names>J. D.</given-names></name> <name><surname>Rush</surname> <given-names>C. M.</given-names></name></person-group> (<year>1993</year>). <source><italic>Methods for Research on Soilborne Phytopathogenic Fungi.</italic></source> <publisher-loc>Saint Paul, MN</publisher-loc>: <publisher-name>The American Phytopathological Society</publisher-name>. <pub-id pub-id-type="doi">10.2307/3760494</pub-id></citation></ref>
<ref id="B13"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Boetzer</surname> <given-names>M.</given-names></name> <name><surname>Henkel</surname> <given-names>C. V.</given-names></name> <name><surname>Jansen</surname> <given-names>H. J.</given-names></name> <name><surname>Butler</surname> <given-names>D.</given-names></name> <name><surname>Pirovano</surname> <given-names>W.</given-names></name></person-group> (<year>2011</year>). <article-title>Scaffolding pre-assembled contigs using SSPACE.</article-title> <source><italic>Bioinformatics</italic></source> <volume>27</volume> <fpage>578</fpage>&#x2013;<lpage>579</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btq683</pub-id> <pub-id pub-id-type="pmid">21149342</pub-id></citation></ref>
<ref id="B14"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bolger</surname> <given-names>A. M.</given-names></name> <name><surname>Lohse</surname> <given-names>M.</given-names></name> <name><surname>Usadel</surname> <given-names>B.</given-names></name></person-group> (<year>2014</year>). <article-title>Trimmomatic: a flexible trimmer for Illumina sequence data.</article-title> <source><italic>Bioinformatics</italic></source> <volume>30</volume> <fpage>2114</fpage>&#x2013;<lpage>2120</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btu170</pub-id> <pub-id pub-id-type="pmid">24695404</pub-id></citation></ref>
<ref id="B15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Camacho</surname> <given-names>C.</given-names></name> <name><surname>Coulouris</surname> <given-names>G.</given-names></name> <name><surname>Avagyan</surname> <given-names>V.</given-names></name> <name><surname>Ma</surname> <given-names>N.</given-names></name> <name><surname>Papadopoulos</surname> <given-names>J.</given-names></name> <name><surname>Bealer</surname> <given-names>K.</given-names></name><etal/></person-group> (<year>2009</year>). <article-title>BLAST+: architecture and applications.</article-title> <source><italic>BMC Bioinformatics</italic></source> <volume>10</volume>:<issue>421</issue>. <pub-id pub-id-type="doi">10.1186/1471-2105-10-421</pub-id> <pub-id pub-id-type="pmid">20003500</pub-id></citation></ref>
<ref id="B16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cantarel</surname> <given-names>B. L.</given-names></name> <name><surname>Korf</surname> <given-names>I.</given-names></name> <name><surname>Robb</surname> <given-names>S. M. C.</given-names></name> <name><surname>Parra</surname> <given-names>G.</given-names></name> <name><surname>Ross</surname> <given-names>E.</given-names></name> <name><surname>Moore</surname> <given-names>B.</given-names></name><etal/></person-group> (<year>2008</year>). <article-title>MAKER: an easy-to-use annotation pipeline designed for emerging model organism genomes.</article-title> <source><italic>Genome Res.</italic></source> <volume>18</volume> <fpage>188</fpage>&#x2013;<lpage>196</lpage>. <pub-id pub-id-type="doi">10.1101/gr.6743907</pub-id> <pub-id pub-id-type="pmid">18025269</pub-id></citation></ref>
<ref id="B17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Carlson</surname> <given-names>J. E.</given-names></name> <name><surname>Tulsieram</surname> <given-names>L. K.</given-names></name> <name><surname>Glaubitz</surname> <given-names>J. C.</given-names></name> <name><surname>Luk</surname> <given-names>V. W. K.</given-names></name> <name><surname>Kauffeldt</surname> <given-names>C.</given-names></name> <name><surname>Rutledge</surname> <given-names>R.</given-names></name></person-group> (<year>1991</year>). <article-title>Segregation of random amplified DNA markers in F1 progeny of conifers.</article-title> <source><italic>Theor. Appl. Genet.</italic></source> <volume>83</volume> <fpage>194</fpage>&#x2013;<lpage>200</lpage>. <pub-id pub-id-type="doi">10.1007/BF00226251</pub-id> <pub-id pub-id-type="pmid">24202358</pub-id></citation></ref>
<ref id="B18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Copley</surname> <given-names>T.</given-names></name> <name><surname>Bayen</surname> <given-names>S.</given-names></name> <name><surname>Jabaji</surname> <given-names>S.</given-names></name></person-group> (<year>2017</year>). <article-title>Biochar amendment modifies expression of soybean and <italic>Rhizoctonia solani</italic> genes leading to increased severity of <italic>Rhizoctonia</italic> foliar blight.</article-title> <source><italic>Front. Plant Sci.</italic></source> <volume>8</volume>:<issue>221</issue>. <pub-id pub-id-type="doi">10.3389/fpls.2017.00221</pub-id> <pub-id pub-id-type="pmid">28270822</pub-id></citation></ref>
<ref id="B19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>&#x010C;re&#x0161;nar</surname> <given-names>B.</given-names></name> <name><surname>Petri&#x010D;</surname> <given-names>&#x0160;</given-names></name></person-group> (<year>2011</year>). <article-title>Cytochrome P450 enzymes in the fungal kingdom.</article-title> <source><italic>Biochim. Biophys. Acta Proteins Proteomics</italic></source> <volume>1814</volume> <fpage>29</fpage>&#x2013;<lpage>35</lpage>. <pub-id pub-id-type="doi">10.1016/j.bbapap.2010.06.020</pub-id> <pub-id pub-id-type="pmid">20619366</pub-id></citation></ref>
<ref id="B20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cubeta</surname> <given-names>M. A.</given-names></name> <name><surname>Thomas</surname> <given-names>E.</given-names></name> <name><surname>Dean</surname> <given-names>R. A.</given-names></name> <name><surname>Jabaji</surname> <given-names>S.</given-names></name> <name><surname>Neate</surname> <given-names>S. M.</given-names></name> <name><surname>Tavantzis</surname> <given-names>S.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>Draft genome sequence of the plant-pathogenic soil fungus <italic>Rhizoctonia solani</italic> anastomosis group 3 strain Rhs1AP.</article-title> <source><italic>Genome Announc.</italic></source> <volume>2</volume>:<issue>e01072-14</issue>. <pub-id pub-id-type="doi">10.1128/genomeA.01072-14</pub-id> <pub-id pub-id-type="pmid">25359908</pub-id></citation></ref>
<ref id="B21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Emanuelsson</surname> <given-names>O.</given-names></name> <name><surname>Brunak</surname> <given-names>S.</given-names></name> <name><surname>von Heijne</surname> <given-names>G.</given-names></name> <name><surname>Nielsen</surname> <given-names>H.</given-names></name></person-group> (<year>2007</year>). <article-title>Locating proteins in the cell using TargetP, SignalP and related tools.</article-title> <source><italic>Nat. Protoc.</italic></source> <volume>2</volume> <fpage>953</fpage>&#x2013;<lpage>971</lpage>. <pub-id pub-id-type="doi">10.1038/nprot.2007.131</pub-id> <pub-id pub-id-type="pmid">17446895</pub-id></citation></ref>
<ref id="B22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Farrer</surname> <given-names>R. A.</given-names></name></person-group> (<year>2017</year>). <article-title>Synima: a Synteny imaging tool for annotated genome assemblies.</article-title> <source><italic>BMC Bioinformatics</italic></source> <volume>18</volume>:<issue>507</issue>. <pub-id pub-id-type="doi">10.1186/s12859-017-1939-7</pub-id> <pub-id pub-id-type="pmid">29162056</pub-id></citation></ref>
<ref id="B23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Finn</surname> <given-names>R. D.</given-names></name> <name><surname>Bateman</surname> <given-names>A.</given-names></name> <name><surname>Clements</surname> <given-names>J.</given-names></name> <name><surname>Coggill</surname> <given-names>P.</given-names></name> <name><surname>Eberhardt</surname> <given-names>R. Y.</given-names></name> <name><surname>Eddy</surname> <given-names>S. R.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>Pfam: the protein families database.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>42</volume> <fpage>D222</fpage>&#x2013;<lpage>D230</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkt1223</pub-id> <pub-id pub-id-type="pmid">24288371</pub-id></citation></ref>
<ref id="B24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Fochi</surname> <given-names>V.</given-names></name> <name><surname>Chitarra</surname> <given-names>W.</given-names></name> <name><surname>Kohler</surname> <given-names>A.</given-names></name> <name><surname>Voyron</surname> <given-names>S.</given-names></name> <name><surname>Singan</surname> <given-names>V. R.</given-names></name> <name><surname>Lindquist</surname> <given-names>E. A.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>Fungal and plant gene expression in the <italic>Tulasnella calospora</italic>&#x2013;<italic>Serapias vomeracea</italic> symbiosis provides clues about nitrogen pathways in orchid Mycorrhizas.</article-title> <source><italic>New Phytol.</italic></source> <volume>213</volume> <fpage>365</fpage>&#x2013;<lpage>379</lpage>. <pub-id pub-id-type="doi">10.1111/nph.14279</pub-id> <pub-id pub-id-type="pmid">27859287</pub-id></citation></ref>
<ref id="B25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Foley</surname> <given-names>R. C.</given-names></name> <name><surname>Gleason</surname> <given-names>C. A.</given-names></name> <name><surname>Anderson</surname> <given-names>J. P.</given-names></name> <name><surname>Hamann</surname> <given-names>T.</given-names></name> <name><surname>Singh</surname> <given-names>K. B.</given-names></name></person-group> (<year>2013</year>). <article-title>Genetic and genomic analysis of <italic>Rhizoctonia solani</italic> interactions with <italic>Arabidopsis</italic>; evidence of resistance mediated through NADPH oxidases.</article-title> <source><italic>PLoS One</italic></source> <volume>8</volume>:<issue>e56814</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0056814</pub-id> <pub-id pub-id-type="pmid">23451091</pub-id></citation></ref>
<ref id="B26"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ghosh</surname> <given-names>S.</given-names></name> <name><surname>Mirza</surname> <given-names>N.</given-names></name> <name><surname>Kanwar</surname> <given-names>P.</given-names></name> <name><surname>Tyagi</surname> <given-names>K.</given-names></name> <name><surname>Jha</surname> <given-names>G.</given-names></name></person-group> (<year>2019</year>). <article-title>Genome analysis provides insight about pathogenesis of Indian strains of <italic>Rhizoctonia solani</italic> in rice.</article-title> <source><italic>Funct. Integr. Genomics</italic></source> <volume>19</volume> <fpage>799</fpage>&#x2013;<lpage>810</lpage>. <pub-id pub-id-type="doi">10.1007/s10142-019-00687-y</pub-id> <pub-id pub-id-type="pmid">31102065</pub-id></citation></ref>
<ref id="B27"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gonzalez</surname> <given-names>D.</given-names></name> <name><surname>Carling</surname> <given-names>D. E.</given-names></name> <name><surname>Kuninaga</surname> <given-names>S.</given-names></name> <name><surname>Vilgalys</surname> <given-names>R.</given-names></name> <name><surname>Cubeta</surname> <given-names>M. A.</given-names></name></person-group> (<year>2001</year>). <article-title>Ribosomal DNA systematics of <italic>Ceratobasidium</italic> and <italic>Thanatephorus</italic> with <italic>Rhizoctonia anamorphs</italic>.</article-title> <source><italic>Mycologia</italic></source> <volume>93</volume> <fpage>1138</fpage>&#x2013;<lpage>1150</lpage>. <pub-id pub-id-type="doi">10.1080/00275514.2001.12063247</pub-id></citation></ref>
<ref id="B28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>G&#x00F3;nzalez</surname> <given-names>D.</given-names></name> <name><surname>Rodriguez-Carres</surname> <given-names>M.</given-names></name> <name><surname>Boekhout</surname> <given-names>T.</given-names></name> <name><surname>Stalpers</surname> <given-names>J.</given-names></name> <name><surname>Kuramae</surname> <given-names>E. E.</given-names></name> <name><surname>Nakatani</surname> <given-names>A. K.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>Phylogenetic relationships of <italic>Rhizoctonia</italic> fungi within the Cantharellales.</article-title> <source><italic>Fungal Biol.</italic></source> <volume>120</volume> <fpage>603</fpage>&#x2013;<lpage>619</lpage>. <pub-id pub-id-type="doi">10.1016/j.funbio.2016.01.012</pub-id> <pub-id pub-id-type="pmid">27020160</pub-id></citation></ref>
<ref id="B29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Grabherr</surname> <given-names>M. G.</given-names></name> <name><surname>Haas</surname> <given-names>B. J.</given-names></name> <name><surname>Yassour</surname> <given-names>M.</given-names></name> <name><surname>Levin</surname> <given-names>J. Z.</given-names></name> <name><surname>Thompson</surname> <given-names>D. A.</given-names></name> <name><surname>Amit</surname> <given-names>I.</given-names></name><etal/></person-group> (<year>2011</year>). <article-title>Full-length transcriptome assembly from RNA-Seq data without a reference genome.</article-title> <source><italic>Nat. Biotechnol.</italic></source> <volume>29</volume> <fpage>644</fpage>&#x2013;<lpage>652</lpage>. <pub-id pub-id-type="doi">10.1038/nbt.1883</pub-id> <pub-id pub-id-type="pmid">21572440</pub-id></citation></ref>
<ref id="B30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gurevich</surname> <given-names>A.</given-names></name> <name><surname>Saveliev</surname> <given-names>V.</given-names></name> <name><surname>Vyahhi</surname> <given-names>N.</given-names></name> <name><surname>Tesler</surname> <given-names>G.</given-names></name></person-group> (<year>2013</year>). <article-title>QUAST: quality assessment tool for genome assemblies.</article-title> <source><italic>Bioinformatics</italic></source> <volume>29</volume> <fpage>1072</fpage>&#x2013;<lpage>1075</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btt086</pub-id> <pub-id pub-id-type="pmid">23422339</pub-id></citation></ref>
<ref id="B31"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Haft</surname> <given-names>D. H.</given-names></name> <name><surname>Selengut</surname> <given-names>J. D.</given-names></name> <name><surname>White</surname> <given-names>O.</given-names></name></person-group> (<year>2003</year>). <article-title>The TIGRFAMs database of protein families.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>31</volume> <fpage>371</fpage>&#x2013;<lpage>373</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkg128</pub-id> <pub-id pub-id-type="pmid">12520025</pub-id></citation></ref>
<ref id="B32"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hane</surname> <given-names>J. K.</given-names></name> <name><surname>Anderson</surname> <given-names>J. P.</given-names></name> <name><surname>Williams</surname> <given-names>A. H.</given-names></name> <name><surname>Sperschneider</surname> <given-names>J.</given-names></name> <name><surname>Singh</surname> <given-names>K. B.</given-names></name></person-group> (<year>2014</year>). <article-title>Genome sequencing and comparative genomics of the broad host-range pathogen <italic>Rhizoctonia solani</italic> AG8.</article-title> <source><italic>PLoS Genet.</italic></source> <volume>10</volume>:<issue>e1004281</issue>. <pub-id pub-id-type="doi">10.1371/journal.pgen.1004281</pub-id> <pub-id pub-id-type="pmid">24810276</pub-id></citation></ref>
<ref id="B33"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Henrissat</surname> <given-names>B.</given-names></name></person-group> (<year>1991</year>). <article-title>A classification of glycosyl hydrolases based on amino acid sequence similarities.</article-title> <source><italic>Biochem. J.</italic></source> <volume>280(Pt. 2)</volume> <fpage>309</fpage>&#x2013;<lpage>316</lpage>. <pub-id pub-id-type="doi">10.1042/bj2800309</pub-id> <pub-id pub-id-type="pmid">1747104</pub-id></citation></ref>
<ref id="B34"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hossain</surname> <given-names>M. K.</given-names></name> <name><surname>Tze</surname> <given-names>O. S.</given-names></name> <name><surname>Nadarajah</surname> <given-names>K.</given-names></name> <name><surname>Jena</surname> <given-names>K.</given-names></name> <name><surname>Bhuiyan</surname> <given-names>M. A. R.</given-names></name> <name><surname>Ratnam</surname> <given-names>W.</given-names></name></person-group> (<year>2014</year>). <article-title>Identification and validation of sheath blight resistance in rice (<italic>Oryza sativa</italic> L.) cultivars against <italic>Rhizoctonia solani</italic>.</article-title> <source><italic>Can. J. Plant Pathol.</italic></source> <volume>36</volume> <fpage>482</fpage>&#x2013;<lpage>490</lpage>. <pub-id pub-id-type="doi">10.1080/07060661.2014.970577</pub-id></citation></ref>
<ref id="B35"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Huerta-Cepas</surname> <given-names>J.</given-names></name> <name><surname>Serra</surname> <given-names>F.</given-names></name> <name><surname>Bork</surname> <given-names>P.</given-names></name></person-group> (<year>2016</year>). <article-title>ETE 3: reconstruction, analysis, and visualization of phylogenomic data.</article-title> <source><italic>Mol. Biol. Evol.</italic></source> <volume>33</volume> <fpage>1635</fpage>&#x2013;<lpage>1638</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msw046</pub-id> <pub-id pub-id-type="pmid">26921390</pub-id></citation></ref>
<ref id="B36"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hulo</surname> <given-names>N.</given-names></name> <name><surname>Sigrist</surname> <given-names>C. J.</given-names></name> <name><surname>Le Saux</surname> <given-names>V.</given-names></name> <name><surname>Langendijk-Genevaux</surname> <given-names>P. S.</given-names></name> <name><surname>Bordoli</surname> <given-names>L.</given-names></name> <name><surname>Gattiker</surname> <given-names>A.</given-names></name><etal/></person-group> (<year>2004</year>). <article-title>Recent improvements to the PROSITE database.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>32</volume> <fpage>D134</fpage>&#x2013;<lpage>D137</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkh044</pub-id> <pub-id pub-id-type="pmid">14681377</pub-id></citation></ref>
<ref id="B37"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jovanovic</surname> <given-names>N.</given-names></name> <name><surname>Mikheyev</surname> <given-names>A. S.</given-names></name></person-group> (<year>2019</year>). <article-title>Interactive web-based visualization and sharing of phylogenetic trees using phylogeny.IO.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>47</volume> <fpage>W266</fpage>&#x2013;<lpage>W269</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkz356</pub-id> <pub-id pub-id-type="pmid">31114886</pub-id></citation></ref>
<ref id="B38"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>K&#x00E4;ll</surname> <given-names>L.</given-names></name> <name><surname>Krogh</surname> <given-names>A.</given-names></name> <name><surname>Sonnhammer</surname> <given-names>E. L. L.</given-names></name></person-group> (<year>2007</year>). <article-title>Advantages of combined transmembrane topology and signal peptide prediction-the Phobius web server.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>35</volume> <fpage>W429</fpage>&#x2013;<lpage>W432</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkm256</pub-id> <pub-id pub-id-type="pmid">17483518</pub-id></citation></ref>
<ref id="B39"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kameshwar</surname> <given-names>A. K. S.</given-names></name> <name><surname>Ramos</surname> <given-names>L. P.</given-names></name> <name><surname>Qin</surname> <given-names>W.</given-names></name></person-group> (<year>2019</year>). <article-title>CAZymes-based ranking of fungi (CBRF): an interactive web database for identifying fungi with extrinsic plant biomass degrading abilities.</article-title> <source><italic>Bioresour. Bioprocess.</italic></source> <volume>6</volume>:<issue>51</issue>. <pub-id pub-id-type="doi">10.1186/s40643-019-0286-0</pub-id></citation></ref>
<ref id="B40"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Keijer</surname> <given-names>J.</given-names></name> <name><surname>Korsman</surname> <given-names>M. G.</given-names></name> <name><surname>Dullemans</surname> <given-names>A. M.</given-names></name> <name><surname>Houterman</surname> <given-names>P. M.</given-names></name> <name><surname>De Bree</surname> <given-names>J.</given-names></name> <name><surname>Van Silfhout</surname> <given-names>C. H.</given-names></name></person-group> (<year>1997</year>). <article-title>In vitro analysis of host plant specificity in <italic>Rhizoctonia solani</italic>.</article-title> <source><italic>Plant Pathol.</italic></source> <volume>46</volume> <fpage>659</fpage>&#x2013;<lpage>669</lpage>. <pub-id pub-id-type="doi">10.1046/j.1365-3059.1997.d01-61.x</pub-id></citation></ref>
<ref id="B41"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kim</surname> <given-names>K. T.</given-names></name> <name><surname>Jeon</surname> <given-names>J.</given-names></name> <name><surname>Choi</surname> <given-names>J.</given-names></name> <name><surname>Cheong</surname> <given-names>K.</given-names></name> <name><surname>Song</surname> <given-names>H.</given-names></name> <name><surname>Choi</surname> <given-names>G.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>Kingdom-wide analysis of fungal small secreted proteins (SSPs) reveals their potential role in host association.</article-title> <source><italic>Front. Plant Sci.</italic></source> <volume>7</volume>:<issue>186</issue>. <pub-id pub-id-type="doi">10.3389/fpls.2016.00186</pub-id> <pub-id pub-id-type="pmid">26925088</pub-id></citation></ref>
<ref id="B42"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Krzywinski</surname> <given-names>M.</given-names></name> <name><surname>Schein</surname> <given-names>J.</given-names></name> <name><surname>Birol</surname> <given-names>I.</given-names></name> <name><surname>Connors</surname> <given-names>J.</given-names></name> <name><surname>Gascoyne</surname> <given-names>R.</given-names></name> <name><surname>Horsman</surname> <given-names>D.</given-names></name><etal/></person-group> (<year>2009</year>). <article-title>Circos: an information aesthetic for comparative genomics.</article-title> <source><italic>Genome Res.</italic></source> <volume>19</volume> <fpage>1639</fpage>&#x2013;<lpage>1645</lpage>. <pub-id pub-id-type="doi">10.1101/gr.092759.109</pub-id> <pub-id pub-id-type="pmid">19541911</pub-id></citation></ref>
<ref id="B43"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kumar</surname> <given-names>S.</given-names></name> <name><surname>Stecher</surname> <given-names>G.</given-names></name> <name><surname>Li</surname> <given-names>M.</given-names></name> <name><surname>Knyaz</surname> <given-names>C.</given-names></name> <name><surname>Tamura</surname> <given-names>K.</given-names></name></person-group> (<year>2018</year>). <article-title>MEGA X: molecular evolutionary genetics analysis across computing platforms.</article-title> <source><italic>Mol. Biol. Evol.</italic></source> <volume>35</volume> <fpage>1547</fpage>&#x2013;<lpage>1549</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msy096</pub-id> <pub-id pub-id-type="pmid">29722887</pub-id></citation></ref>
<ref id="B44"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lakshman</surname> <given-names>D. K.</given-names></name> <name><surname>Jian</surname> <given-names>J.</given-names></name> <name><surname>Tavantzis</surname> <given-names>S. M.</given-names></name></person-group> (<year>1998</year>). <article-title>A double-stranded RNA element from a hypovirulent strain of <italic>Rhizoctonia solani</italic> occurs in DNA form and is genetically related to the pentafunctional AROM protein of the shikimate pathway.</article-title> <source><italic>Proc. Natl. Acad. Sci. U.S.A.</italic></source> <volume>95</volume> <fpage>6425</fpage>&#x2013;<lpage>6429</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.95.11.6425</pub-id> <pub-id pub-id-type="pmid">9600982</pub-id></citation></ref>
<ref id="B45"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lakshman</surname> <given-names>D. K.</given-names></name> <name><surname>Roberts</surname> <given-names>D. P.</given-names></name> <name><surname>Garrett</surname> <given-names>W. M.</given-names></name> <name><surname>Natarajan</surname> <given-names>S. S.</given-names></name> <name><surname>Darwish</surname> <given-names>O.</given-names></name> <name><surname>Alkharouf</surname> <given-names>N.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>Proteomic investigation of <italic>Rhizoctonia solani</italic> AG 4 identifies secretome and mycelial proteins with roles in plant cell wall degradation and virulence.</article-title> <source><italic>J. Agric. Food Chem.</italic></source> <volume>64</volume> <fpage>3101</fpage>&#x2013;<lpage>3110</lpage>. <pub-id pub-id-type="doi">10.1021/acs.jafc.5b05735</pub-id> <pub-id pub-id-type="pmid">27019116</pub-id></citation></ref>
<ref id="B46"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lee</surname> <given-names>D.-Y.</given-names></name> <name><surname>Jeon</surname> <given-names>J.</given-names></name> <name><surname>Kim</surname> <given-names>K.-T.</given-names></name> <name><surname>Cheong</surname> <given-names>K.</given-names></name> <name><surname>Song</surname> <given-names>H.</given-names></name> <name><surname>Choi</surname> <given-names>G.</given-names></name><etal/></person-group> (<year>2021</year>). <article-title>Comparative genome analyses of four rice-infecting <italic>Rhizoctonia solani</italic> isolates reveal extensive enrichment of homogalacturonan modification genes.</article-title> <source><italic>BMC Genomics</italic></source> <volume>22</volume>:<issue>242</issue>. <pub-id pub-id-type="doi">10.1186/s12864-021-07549-7</pub-id> <pub-id pub-id-type="pmid">33827423</pub-id></citation></ref>
<ref id="B47"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>L.</given-names></name> <name><surname>Stoeckert</surname> <given-names>C. J.</given-names></name> <name><surname>Roos</surname> <given-names>D. S.</given-names></name></person-group> (<year>2003</year>). <article-title>OrthoMCL: identification of ortholog groups for eukaryotic genomes.</article-title> <source><italic>Genome Res.</italic></source> <volume>13</volume> <fpage>2178</fpage>&#x2013;<lpage>2189</lpage>. <pub-id pub-id-type="doi">10.1101/gr.1224503</pub-id> <pub-id pub-id-type="pmid">12952885</pub-id></citation></ref>
<ref id="B48"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>T.</given-names></name> <name><surname>Wu</surname> <given-names>Y.</given-names></name> <name><surname>Wang</surname> <given-names>Y.</given-names></name> <name><surname>Gao</surname> <given-names>H.</given-names></name> <name><surname>Gupta</surname> <given-names>V. K.</given-names></name> <name><surname>Duan</surname> <given-names>X.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>Secretome profiling reveals virulence-associated proteins of <italic>Fusarium proliferatum</italic> during interaction with banana fruit.</article-title> <source><italic>Biomolecules</italic></source> <volume>9</volume>:<issue>246</issue>. <pub-id pub-id-type="doi">10.3390/biom9060246</pub-id> <pub-id pub-id-type="pmid">31234604</pub-id></citation></ref>
<ref id="B49"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Linder</surname> <given-names>M.</given-names></name> <name><surname>Lindeberg</surname> <given-names>G.</given-names></name> <name><surname>Reinikainen</surname> <given-names>T.</given-names></name> <name><surname>Teeri</surname> <given-names>T. T.</given-names></name> <name><surname>Pettersson</surname> <given-names>G.</given-names></name></person-group> (<year>1995</year>). <article-title>The difference in affinity between two fungal cellulose-binding domains is dominated by a single amino acid substitution.</article-title> <source><italic>FEBS Lett.</italic></source> <volume>372</volume> <fpage>96</fpage>&#x2013;<lpage>98</lpage>. <pub-id pub-id-type="doi">10.1016/0014-5793(95)00961-8</pub-id></citation></ref>
<ref id="B50"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lombard</surname> <given-names>V.</given-names></name> <name><surname>Golaconda Ramulu</surname> <given-names>H.</given-names></name> <name><surname>Drula</surname> <given-names>E.</given-names></name> <name><surname>Coutinho</surname> <given-names>P. M.</given-names></name> <name><surname>Henrissat</surname> <given-names>B.</given-names></name></person-group> (<year>2014</year>). <article-title>The carbohydrate-active enzymes database (CAZy) in 2013.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>42</volume> <fpage>D490</fpage>&#x2013;<lpage>D495</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkt1178</pub-id> <pub-id pub-id-type="pmid">24270786</pub-id></citation></ref>
<ref id="B51"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Luo</surname> <given-names>R.</given-names></name> <name><surname>Liu</surname> <given-names>B.</given-names></name> <name><surname>Xie</surname> <given-names>Y.</given-names></name> <name><surname>Li</surname> <given-names>Z.</given-names></name> <name><surname>Huang</surname> <given-names>W.</given-names></name> <name><surname>Yuan</surname> <given-names>J.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>SOAPdenovo2: an empirically improved memory-efficient short-read de novo assembler.</article-title> <source><italic>Gigascience</italic></source> <volume>1</volume>:<issue>18</issue>. <pub-id pub-id-type="doi">10.1186/2047-217X-1-18</pub-id> <pub-id pub-id-type="pmid">23587118</pub-id></citation></ref>
<ref id="B52"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mar&#x00E7;ais</surname> <given-names>G.</given-names></name> <name><surname>Kingsford</surname> <given-names>C.</given-names></name></person-group> (<year>2011</year>). <article-title>A fast, lock-free approach for efficient parallel counting of occurrences of k-mers.</article-title> <source><italic>Bioinformatics</italic></source> <volume>27</volume> <fpage>764</fpage>&#x2013;<lpage>770</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btr011</pub-id> <pub-id pub-id-type="pmid">21217122</pub-id></citation></ref>
<ref id="B53"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mar&#x00E7;ais</surname> <given-names>G.</given-names></name> <name><surname>Delcher</surname> <given-names>A. L.</given-names></name> <name><surname>Phillippy</surname> <given-names>A. M.</given-names></name> <name><surname>Coston</surname> <given-names>R.</given-names></name> <name><surname>Salzberg</surname> <given-names>S. L.</given-names></name> <name><surname>Zimin</surname> <given-names>A.</given-names></name></person-group> (<year>2018</year>). <article-title>MUMmer4: a fast and versatile genome alignment system.</article-title> <source><italic>PLoS Comput. Biol.</italic></source> <volume>14</volume>:<issue>e1005944</issue>. <pub-id pub-id-type="doi">10.1371/journal.pcbi.1005944</pub-id> <pub-id pub-id-type="pmid">29373581</pub-id></citation></ref>
<ref id="B54"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Marchler-Bauer</surname> <given-names>A.</given-names></name> <name><surname>Zheng</surname> <given-names>C.</given-names></name> <name><surname>Chitsaz</surname> <given-names>F.</given-names></name> <name><surname>Derbyshire</surname> <given-names>M. K.</given-names></name> <name><surname>Geer</surname> <given-names>L. Y.</given-names></name> <name><surname>Geer</surname> <given-names>R. C.</given-names></name><etal/></person-group> (<year>2013</year>). <article-title>CDD: conserved domains and protein three-dimensional structure.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>41</volume> <fpage>D348</fpage>&#x2013;<lpage>D352</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gks1243</pub-id> <pub-id pub-id-type="pmid">23197659</pub-id></citation></ref>
<ref id="B55"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>McCotter</surname> <given-names>S. W.</given-names></name> <name><surname>Horianopoulos</surname> <given-names>L. C.</given-names></name> <name><surname>Kronstad</surname> <given-names>J. W.</given-names></name></person-group> (<year>2016</year>). <article-title>Regulation of the fungal secretome.</article-title> <source><italic>Curr. Genet.</italic></source> <volume>62</volume> <fpage>533</fpage>&#x2013;<lpage>545</lpage>. <pub-id pub-id-type="doi">10.1007/s00294-016-0578-2</pub-id> <pub-id pub-id-type="pmid">26879194</pub-id></citation></ref>
<ref id="B56"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mi</surname> <given-names>H.</given-names></name> <name><surname>Thomas</surname> <given-names>P.</given-names></name></person-group> (<year>2009</year>). <article-title>PANTHER pathway: an ontology-based pathway database coupled with data analysis tools.</article-title> <source><italic>Methods Mol. Biol.</italic></source> <volume>563</volume> <fpage>123</fpage>&#x2013;<lpage>140</lpage>. <pub-id pub-id-type="doi">10.1007/978-1-60761-175-2_7</pub-id></citation></ref>
<ref id="B57"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nadarajah</surname> <given-names>K.</given-names></name> <name><surname>Razali</surname> <given-names>N. M.</given-names></name> <name><surname>Cheah</surname> <given-names>B. H.</given-names></name> <name><surname>Sahruna</surname> <given-names>N. S.</given-names></name> <name><surname>Ismail</surname> <given-names>I.</given-names></name> <name><surname>Tathode</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>Draft genome sequence of <italic>Rhizoctonia solani</italic> anastomosis group 1 subgroup 1A strain 1802/KB isolated from rice.</article-title> <source><italic>Genome Announc.</italic></source> <volume>5</volume>:<issue>e01188-17</issue>. <pub-id pub-id-type="doi">10.1128/genomeA.01188-17</pub-id> <pub-id pub-id-type="pmid">29074665</pub-id></citation></ref>
<ref id="B58"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pryszcz</surname> <given-names>L. P.</given-names></name> <name><surname>Gabald&#x00F3;n</surname> <given-names>T.</given-names></name></person-group> (<year>2016</year>). <article-title>Redundans: an assembly pipeline for highly heterozygous genomes.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>44</volume> <issue>e113</issue>. <pub-id pub-id-type="doi">10.1093/nar/gkw294</pub-id> <pub-id pub-id-type="pmid">27131372</pub-id></citation></ref>
<ref id="B59"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Quevillon</surname> <given-names>E.</given-names></name> <name><surname>Silventoinen</surname> <given-names>V.</given-names></name> <name><surname>Pillai</surname> <given-names>S.</given-names></name> <name><surname>Harte</surname> <given-names>N.</given-names></name> <name><surname>Mulder</surname> <given-names>N.</given-names></name> <name><surname>Apweiler</surname> <given-names>R.</given-names></name><etal/></person-group> (<year>2005</year>). <article-title>InterProScan: protein domains identifier.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>33</volume> <fpage>W116</fpage>&#x2013;<lpage>W120</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gki442</pub-id> <pub-id pub-id-type="pmid">15980438</pub-id></citation></ref>
<ref id="B60"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Raaijmakers</surname> <given-names>J. M.</given-names></name> <name><surname>Paulitz</surname> <given-names>T. C.</given-names></name> <name><surname>Steinberg</surname> <given-names>C.</given-names></name> <name><surname>Alabouvette</surname> <given-names>C.</given-names></name> <name><surname>Mo&#x00EB;nne-Loccoz</surname> <given-names>Y.</given-names></name></person-group> (<year>2009</year>). <article-title>The rhizosphere: a playground and battlefield for soilborne pathogens and beneficial microorganisms.</article-title> <source><italic>Plant Soil</italic></source> <volume>321</volume> <fpage>341</fpage>&#x2013;<lpage>361</lpage>. <pub-id pub-id-type="doi">10.1007/s11104-008-9568-6</pub-id></citation></ref>
<ref id="B61"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>R&#x00E9;dei</surname> <given-names>G. P.</given-names></name></person-group> (<year>2008</year>). &#x201C;<article-title>CLUSTAL W (improving the sensitivity of progressive multiple sequence alignment through sequence weighting, position-specific gap penalties and weight matrix choice)</article-title>,&#x201D; in <source><italic>Encyclopedia of Genetics, Genomics, Proteomics and Informatics</italic></source>, (<publisher-loc>Dordrecht</publisher-loc>: <publisher-name>Springer</publisher-name>). <pub-id pub-id-type="doi">10.1007/978-1-4020-6754-9_3188</pub-id> <pub-id pub-id-type="pmid">34422537</pub-id></citation></ref>
<ref id="B62"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sayers</surname> <given-names>E. W.</given-names></name> <name><surname>Beck</surname> <given-names>J.</given-names></name> <name><surname>Brister</surname> <given-names>J. R.</given-names></name> <name><surname>Bolton</surname> <given-names>E. E.</given-names></name> <name><surname>Canese</surname> <given-names>K.</given-names></name> <name><surname>Comeau</surname> <given-names>D. C.</given-names></name><etal/></person-group> (<year>2020</year>). <article-title>Database resources of the national center for biotechnology information.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>48</volume> <fpage>D9</fpage>&#x2013;<lpage>D16</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkz899</pub-id> <pub-id pub-id-type="pmid">31602479</pub-id></citation></ref>
<ref id="B63"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Seppey</surname> <given-names>M.</given-names></name> <name><surname>Manni</surname> <given-names>M.</given-names></name> <name><surname>Zdobnov</surname> <given-names>E. M.</given-names></name></person-group> (<year>2019</year>). &#x201C;<article-title>BUSCO: assessing genome assembly and annotation completeness</article-title>,&#x201D; in <source><italic>Gene Prediction. Methods in Molecular Biology</italic></source>, <role>ed.</role> <person-group person-group-type="editor"><name><surname>Kollmar</surname> <given-names>M.</given-names></name></person-group> (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>Humana Press Inc.</publisher-name>), <fpage>227</fpage>&#x2013;<lpage>245</lpage>. <pub-id pub-id-type="doi">10.1007/978-1-4939-9173-0_14</pub-id></citation></ref>
<ref id="B64"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shu</surname> <given-names>C.</given-names></name> <name><surname>Zhao</surname> <given-names>M.</given-names></name> <name><surname>Anderson</surname> <given-names>J. P.</given-names></name> <name><surname>Garg</surname> <given-names>G.</given-names></name> <name><surname>Singh</surname> <given-names>K. B.</given-names></name> <name><surname>Zheng</surname> <given-names>W.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>Transcriptome analysis reveals molecular mechanisms of sclerotial development in the rice sheath blight pathogen <italic>Rhizoctonia solani</italic> AG1-IA.</article-title> <source><italic>Funct. Integr. Genomics</italic></source> <volume>19</volume> <fpage>743</fpage>&#x2013;<lpage>758</lpage>. <pub-id pub-id-type="doi">10.1007/s10142-019-00677-0</pub-id> <pub-id pub-id-type="pmid">31054140</pub-id></citation></ref>
<ref id="B65"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Song</surname> <given-names>L.</given-names></name> <name><surname>Shankar</surname> <given-names>D. S.</given-names></name> <name><surname>Florea</surname> <given-names>L.</given-names></name></person-group> (<year>2016</year>). <article-title>Rascaf: improving genome assembly with RNA sequencing data.</article-title> <source><italic>Plant Genome</italic></source> <volume>9</volume>:<issue>plantgenome2016.03.0027</issue>. <pub-id pub-id-type="doi">10.3835/plantgenome2016.03.0027</pub-id> <pub-id pub-id-type="pmid">27902792</pub-id></citation></ref>
<ref id="B66"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sperschneider</surname> <given-names>J.</given-names></name> <name><surname>Gardiner</surname> <given-names>D. M.</given-names></name> <name><surname>Dodds</surname> <given-names>P. N.</given-names></name> <name><surname>Tini</surname> <given-names>F.</given-names></name> <name><surname>Covarelli</surname> <given-names>L.</given-names></name> <name><surname>Singh</surname> <given-names>K. B.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>EffectorP: predicting fungal effector proteins from secretomes using machine learning.</article-title> <source><italic>New Phytol.</italic></source> <volume>210</volume> <fpage>743</fpage>&#x2013;<lpage>761</lpage>. <pub-id pub-id-type="doi">10.1111/nph.13794</pub-id> <pub-id pub-id-type="pmid">26680733</pub-id></citation></ref>
<ref id="B67"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Stergiopoulos</surname> <given-names>I.</given-names></name> <name><surname>de Wit</surname> <given-names>P. J. G. M.</given-names></name></person-group> (<year>2009</year>). <article-title>Fungal effector proteins.</article-title> <source><italic>Annu. Rev. Phytopathol.</italic></source> <volume>47</volume> <fpage>233</fpage>&#x2013;<lpage>263</lpage>. <pub-id pub-id-type="doi">10.1146/annurev.phyto.112408.132637</pub-id> <pub-id pub-id-type="pmid">19400631</pub-id></citation></ref>
<ref id="B68"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tarailo-Graovac</surname> <given-names>M.</given-names></name> <name><surname>Chen</surname> <given-names>N.</given-names></name></person-group> (<year>2009</year>). <article-title>Using RepeatMasker to identify repetitive elements in genomic sequences.</article-title> <source><italic>Curr. Protoc. Bioinformatics</italic></source> <volume>Chapter 4</volume>:<issue>Unit 4.10</issue>. <pub-id pub-id-type="doi">10.1002/0471250953.bi0410s25</pub-id> <pub-id pub-id-type="pmid">19274634</pub-id></citation></ref>
<ref id="B69"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Van Bueren</surname> <given-names>A. L.</given-names></name> <name><surname>Morland</surname> <given-names>C.</given-names></name> <name><surname>Gilbert</surname> <given-names>H. J.</given-names></name> <name><surname>Boraston</surname> <given-names>A. B.</given-names></name></person-group> (<year>2005</year>). <article-title>Family 6 carbohydrate binding modules recognize the non-reducing end of &#x03B2;-1,3-linked glucans by presenting a unique ligand binding surface.</article-title> <source><italic>J. Biol. Chem.</italic></source> <volume>280</volume> <fpage>530</fpage>&#x2013;<lpage>537</lpage>. <pub-id pub-id-type="doi">10.1074/jbc.M410113200</pub-id> <pub-id pub-id-type="pmid">15501830</pub-id></citation></ref>
<ref id="B70"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wei</surname> <given-names>M.</given-names></name> <name><surname>Wang</surname> <given-names>A.</given-names></name> <name><surname>Liu</surname> <given-names>Y.</given-names></name> <name><surname>Ma</surname> <given-names>L.</given-names></name> <name><surname>Niu</surname> <given-names>X.</given-names></name> <name><surname>Zheng</surname> <given-names>A.</given-names></name></person-group> (<year>2020</year>). <article-title>Identification of the novel effector RsIA_NP8 in <italic>Rhizoctonia solani</italic> AG1 IA that induces cell death and triggers defense responses in non-host plants.</article-title> <source><italic>Front. Microbiol.</italic></source> <volume>11</volume>:<issue>1115</issue>. <pub-id pub-id-type="doi">10.3389/fmicb.2020.01115</pub-id> <pub-id pub-id-type="pmid">32595615</pub-id></citation></ref>
<ref id="B71"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wibberg</surname> <given-names>D.</given-names></name> <name><surname>Andersson</surname> <given-names>L.</given-names></name> <name><surname>Rupp</surname> <given-names>O.</given-names></name> <name><surname>Goesmann</surname> <given-names>A.</given-names></name> <name><surname>P&#x00FC;hler</surname> <given-names>A.</given-names></name> <name><surname>Varrelmann</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2016a</year>). <article-title>Draft genome sequence of the sugar beet pathogen <italic>Rhizoctonia solani</italic> AG2-2IIIB strain BBA69670.</article-title> <source><italic>J. Biotechnol.</italic></source> <volume>222</volume> <fpage>11</fpage>&#x2013;<lpage>12</lpage>. <pub-id pub-id-type="doi">10.1016/j.jbiotec.2016.02.001</pub-id> <pub-id pub-id-type="pmid">26851388</pub-id></citation></ref>
<ref id="B72"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wibberg</surname> <given-names>D.</given-names></name> <name><surname>Andersson</surname> <given-names>L.</given-names></name> <name><surname>Tzelepis</surname> <given-names>G.</given-names></name> <name><surname>Rupp</surname> <given-names>O.</given-names></name> <name><surname>Blom</surname> <given-names>J.</given-names></name> <name><surname>Jelonek</surname> <given-names>L.</given-names></name><etal/></person-group> (<year>2016b</year>). <article-title>Genome analysis of the sugar beet pathogen <italic>Rhizoctonia solani</italic> AG2-2IIIB revealed high numbers in secreted proteins and cell wall degrading enzymes.</article-title> <source><italic>BMC Genomics</italic></source> <volume>17</volume>:<issue>245</issue>. <pub-id pub-id-type="doi">10.1186/s12864-016-2561-1</pub-id> <pub-id pub-id-type="pmid">26988094</pub-id></citation></ref>
<ref id="B73"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wibberg</surname> <given-names>D.</given-names></name> <name><surname>Genzel</surname> <given-names>F.</given-names></name> <name><surname>Verwaaijen</surname> <given-names>B.</given-names></name> <name><surname>Blom</surname> <given-names>J.</given-names></name> <name><surname>Rupp</surname> <given-names>O.</given-names></name> <name><surname>Goesmann</surname> <given-names>A.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>Draft genome sequence of the potato pathogen <italic>Rhizoctonia solani</italic> AG3-PT isolate Ben3.</article-title> <source><italic>Arch. Microbiol.</italic></source> <volume>199</volume> <fpage>1065</fpage>&#x2013;<lpage>1068</lpage>. <pub-id pub-id-type="doi">10.1007/s00203-017-1394-x</pub-id> <pub-id pub-id-type="pmid">28597196</pub-id></citation></ref>
<ref id="B74"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wibberg</surname> <given-names>D.</given-names></name> <name><surname>Rupp</surname> <given-names>O.</given-names></name> <name><surname>Blom</surname> <given-names>J.</given-names></name> <name><surname>Jelonek</surname> <given-names>L.</given-names></name> <name><surname>Kr&#x00F6;ber</surname> <given-names>M.</given-names></name> <name><surname>Verwaaijen</surname> <given-names>B.</given-names></name><etal/></person-group> (<year>2015a</year>). <article-title>Development of a <italic>Rhizoctonia solani</italic> AG1-IB specific gene model enables comparative genome analyses between phytopathogenic R. <italic>solani</italic> AG1-IA, AG1-IB, AG3 and AG8 isolates.</article-title> <source><italic>PLoS One</italic></source> <volume>10</volume>:<issue>e0144769</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0144769</pub-id> <pub-id pub-id-type="pmid">26690577</pub-id></citation></ref>
<ref id="B75"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wibberg</surname> <given-names>D.</given-names></name> <name><surname>Rupp</surname> <given-names>O.</given-names></name> <name><surname>Jelonek</surname> <given-names>L.</given-names></name> <name><surname>Kr&#x00F6;ber</surname> <given-names>M.</given-names></name> <name><surname>Verwaaijen</surname> <given-names>B.</given-names></name> <name><surname>Blom</surname> <given-names>J.</given-names></name><etal/></person-group> (<year>2015b</year>). <article-title>Improved genome sequence of the phytopathogenic fungus <italic>Rhizoctonia solani</italic> AG1-IB 7/3/14 as established by deep mate-pair sequencing on the MiSeq (Illumina) system.</article-title> <source><italic>J. Biotechnol.</italic></source> <volume>203</volume> <fpage>19</fpage>&#x2013;<lpage>21</lpage>. <pub-id pub-id-type="doi">10.1016/j.jbiotec.2015.03.005</pub-id> <pub-id pub-id-type="pmid">25801332</pub-id></citation></ref>
<ref id="B76"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yamamoto</surname> <given-names>N.</given-names></name> <name><surname>Wang</surname> <given-names>Y.</given-names></name> <name><surname>Lin</surname> <given-names>R.</given-names></name> <name><surname>Liang</surname> <given-names>Y.</given-names></name> <name><surname>Liu</surname> <given-names>Y.</given-names></name> <name><surname>Zhu</surname> <given-names>J.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>Integrative transcriptome analysis discloses the molecular basis of a heterogeneous fungal phytopathogen complex, <italic>Rhizoctonia solani</italic> AG-1 subgroups.</article-title> <source><italic>Sci. Rep.</italic></source> <volume>9</volume>:<issue>19626</issue>. <pub-id pub-id-type="doi">10.1038/s41598-019-55734-2</pub-id> <pub-id pub-id-type="pmid">31873088</pub-id></citation></ref>
<ref id="B77"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yang</surname> <given-names>G.</given-names></name> <name><surname>Li</surname> <given-names>C.</given-names></name></person-group> (<year>2012</year>). &#x201C;<article-title>General description of <italic>Rhizoctonia</italic> species complex</article-title>,&#x201D; in <source><italic>Plant Pathology</italic></source>, <role>ed.</role> <person-group person-group-type="editor"><name><surname>Cumagun</surname> <given-names>C.</given-names></name></person-group> (<publisher-loc>London</publisher-loc>: <publisher-name>INTECH Open Access Publisher</publisher-name>), <fpage>41</fpage>&#x2013;<lpage>52</lpage>. <pub-id pub-id-type="doi">10.5772/39026</pub-id></citation></ref>
<ref id="B78"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yu</surname> <given-names>Y.</given-names></name> <name><surname>Ouyang</surname> <given-names>Y.</given-names></name> <name><surname>Yao</surname> <given-names>W.</given-names></name></person-group> (<year>2018</year>). <article-title>ShinyCircos: an R/Shiny application for interactive creation of Circos plot.</article-title> <source><italic>Bioinformatics</italic></source> <volume>34</volume> <fpage>1229</fpage>&#x2013;<lpage>1231</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btx763</pub-id> <pub-id pub-id-type="pmid">29186362</pub-id></citation></ref>
<ref id="B79"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>H.</given-names></name> <name><surname>Yohe</surname> <given-names>T.</given-names></name> <name><surname>Huang</surname> <given-names>L.</given-names></name> <name><surname>Entwistle</surname> <given-names>S.</given-names></name> <name><surname>Wu</surname> <given-names>P.</given-names></name> <name><surname>Yang</surname> <given-names>Z.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>DbCAN2: a meta server for automated carbohydrate-active enzyme annotation.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>46</volume> <fpage>W95</fpage>&#x2013;<lpage>W101</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gky418</pub-id> <pub-id pub-id-type="pmid">29771380</pub-id></citation></ref>
<ref id="B80"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>J.</given-names></name> <name><surname>Chen</surname> <given-names>L.</given-names></name> <name><surname>Fu</surname> <given-names>C.</given-names></name> <name><surname>Wang</surname> <given-names>L.</given-names></name> <name><surname>Liu</surname> <given-names>H.</given-names></name> <name><surname>Cheng</surname> <given-names>Y.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>Comparative transcriptome analyses of gene expression changes triggered by <italic>Rhizoctonia solani</italic> AG1 IA infection in resistant and susceptible rice varieties.</article-title> <source><italic>Front. Plant Sci.</italic></source> <volume>8</volume>:<issue>1422</issue>. <pub-id pub-id-type="doi">10.3389/fpls.2017.01422</pub-id> <pub-id pub-id-type="pmid">28861102</pub-id></citation></ref>
</ref-list>
<fn-group>
<fn id="footnote1">
<label>1</label>
<p><ext-link ext-link-type="uri" xlink:href="http://genome.jgi.doe.gov/Tulca1/Tulca1.home.htm">http://genome.jgi.doe.gov/Tulca1/Tulca1.home.htm</ext-link></p></fn>
</fn-group>
</back>
</article>
