<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Plant Sci.</journal-id>
<journal-title>Frontiers in Plant Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Plant Sci.</abbrev-journal-title>
<issn pub-type="epub">1664-462X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpls.2014.00594</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Plant Science</subject>
<subj-group>
<subject>Original Research Article</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Annotation of a hybrid partial genome of the coffee rust (<italic>Hemileia vastatrix</italic>) contributes to the gene repertoire catalog of the Pucciniales</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name><surname>Cristancho</surname> <given-names>Marco A.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn001"><sup>&#x0002A;</sup></xref>
<uri xlink:href="http://community.frontiersin.org/people/u/110035"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Botero-Rozo</surname> <given-names>David Octavio</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="http://community.frontiersin.org/people/u/143674"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Giraldo</surname> <given-names>William</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Tabima</surname> <given-names>Javier</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Ria&#x000F1;o-Pach&#x000F3;n</surname> <given-names>Diego Mauricio</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="author-notes" rid="fn003"><sup>&#x02020;</sup></xref>
<uri xlink:href="http://community.frontiersin.org/people/u/50544"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Escobar</surname> <given-names>Carolina</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://community.frontiersin.org/people/u/126997"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Rozo</surname> <given-names>Yomara</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Rivera</surname> <given-names>Luis F.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Dur&#x000E1;n</surname> <given-names>Andr&#x000E9;s</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://community.frontiersin.org/people/u/143297"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Restrepo</surname> <given-names>Silvia</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="http://community.frontiersin.org/people/u/188756"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Eilam</surname> <given-names>Tamar</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Anikster</surname> <given-names>Yehoshua</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<uri xlink:href="http://community.frontiersin.org/people/u/189955"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Gait&#x000E1;n</surname> <given-names>Alvaro L.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://community.frontiersin.org/people/u/189152"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Plant Pathology, National Center for Coffee Research &#x02013; CENICAF&#x000C9;</institution> <country>Chinchin&#x000E1;, Colombia</country></aff>
<aff id="aff2"><sup>2</sup><institution>Departamento de Ciencias Biol&#x000F3;gicas, Universidad de los Andes</institution> <country>Bogot&#x000E1;, Colombia</country></aff>
<aff id="aff3"><sup>3</sup><institution>Institute for Cereal Crops Improvement, Tel Aviv University</institution> <country>Tel Aviv, Israel</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: S&#x000E9;bastien Duplessis, National Institute of Agronomic Research, France</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Guus Bakkeren, Agriculture and Agri-Food Canada, Canada; Diana Fernandez, Institut de Recherche Pour le D&#x000E9;veloppement, France</p></fn>
<fn fn-type="corresp" id="fn001"><p>&#x0002A;Correspondence: Marco A. Cristancho, Department of Plant Pathology, National Center for Coffee Research &#x02013; CENICAF&#x000C9;, Km 4 v&#x000ED;a a Manizales, Chinchin&#x000E1; 2427, Colombia e-mail: <email>marco.cristancho&#x00040;cafedecolombia.com</email></p></fn>
<fn fn-type="other" id="fn002"><p>This article was submitted to Plant-Microbe Interaction, a section of the journal Frontiers in Plant Science.</p></fn>
<fn fn-type="present-address" id="fn003"><p>&#x02020;Present address: Diego Mauricio Ria&#x000F1;o-Pach&#x000F3;n, Lab&#x000F3;ratorio Nacional de Ci&#x000EA;ncia e Tecnologia do Bioetanol, Centro Nacional de Pesquisa em Energia e Materiais, Campinas, S&#x000E3;o Paulo, Brazil</p></fn>
</author-notes>
<pub-date pub-type="epub">
<day>31</day>
<month>10</month>
<year>2014</year>
</pub-date>
<pub-date pub-type="collection">
<year>2014</year>
</pub-date>
<volume>5</volume>
<elocation-id>594</elocation-id>
<history>
<date date-type="received">
<day>30</day>
<month>05</month>
<year>2014</year>
</date>
<date date-type="accepted">
<day>11</day>
<month>10</month>
<year>2014</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x000A9; 2014 Cristancho, Botero-Rozo, Giraldo, Tabima, Ria&#x000F1;o-Pach&#x000F3;n, Escobar, Rozo, Rivera, Dur&#x000E1;n, Restrepo, Eilam, Anikster and Gait&#x000E1;n.</copyright-statement>
<copyright-year>2014</copyright-year>
<license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) or licensor are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract><p>Coffee leaf rust caused by the fungus <italic>Hemileia vastatrix</italic> is the most damaging disease to coffee worldwide. The pathogen has recently appeared in multiple outbreaks in coffee producing countries resulting in significant yield losses and increases in costs related to its control. New races/isolates are constantly emerging as evidenced by the presence of the fungus in plants that were previously resistant. Genomic studies are opening new avenues for the study of the evolution of pathogens, the detailed description of plant-pathogen interactions and the development of molecular techniques for the identification of individual isolates. For this purpose we sequenced 8 different <italic>H. vastatrix</italic> isolates using NGS technologies and gathered partial genome assemblies due to the large repetitive content in the coffee rust hybrid genome; 74.4% of the assembled contigs harbor repetitive sequences. A hybrid assembly of 333 Mb was built based on the 8 isolates; this assembly was used for subsequent analyses. Analysis of the conserved gene space showed that the hybrid <italic>H. vastatrix</italic> genome, though highly fragmented, had a satisfactory level of completion with 91.94% of core protein-coding orthologous genes present. RNA-Seq from urediniospores was used to guide the de novo annotation of the <italic>H. vastatrix</italic> gene complement. In total, 14,445 genes organized in 3921 families were uncovered; a considerable proportion of the predicted proteins (73.8%) were homologous to other Pucciniales species genomes. Several gene families related to the fungal lifestyle were identified, particularly 483 predicted secreted proteins that represent candidate effector genes and will provide interesting hints to decipher virulence in the coffee rust fungus. The genome sequence of Hva will serve as a template to understand the molecular mechanisms used by this fungus to attack the coffee plant, to study the diversity of this species and for the development of molecular markers to distinguish races/isolates.</p></abstract>
<kwd-group>
<kwd>genome</kwd>
<kwd>coffee rust</kwd>
<kwd>coffee</kwd>
<kwd>plant pathogens diversity</kwd>
<kwd>RNA-seq</kwd>
<kwd>genetic variants</kwd>
</kwd-group>
<counts>
<fig-count count="6"/>
<table-count count="4"/>
<equation-count count="0"/>
<ref-count count="68"/>
<page-count count="11"/>
<word-count count="9346"/>
</counts>
</article-meta>
</front>
<body>
<sec sec-type="introduction" id="s1">
<title>Introduction</title>
<p>Coffee rust caused by the fungus <italic>Hemileia vastatrix</italic> (Hva) leads to widespread damage to crops worldwide. The disease develops polycyclic epidemics in a season, which means there is an overlapping succession of infection cycles. Under tropical conditions and in semi-perennial plants, such as coffee, Hva poses a permanent threat for producers. In the absence of control methods, the pathogen has been reported to cause losses of up to 30% in susceptible varieties of the species <italic>Coffea arabica</italic> during mild epidemics (Monaco, <xref ref-type="bibr" rid="B47">1977</xref>; Rivillas et al., <xref ref-type="bibr" rid="B56">2011</xref>). The fungus, which is a biotroph that targets <italic>Coffea</italic> as the single known host genus, spread from Africa and was responsible for the collapse of coffee production in India and Ceylon by the mid XIX century. It arrived in America in 1970, and since then, it has quickly disseminated to all the other coffee-producing areas of the continent. In Colombia, Hva was reported for the first time in 1983 in the central coffee-producing zone of the country (Leguizam&#x000F3;n et al., <xref ref-type="bibr" rid="B38">1984</xref>). The presence of Hva in almost every coffee plantation in the world has been one of the main drivers for plant breeders to release rust-resistant varieties. Recent outbreaks of the disease have affected major areas of coffee production in Colombia (Rozo et al., <xref ref-type="bibr" rid="B59">2012</xref>) and Central America (Cressey, <xref ref-type="bibr" rid="B13">2013</xref>), and the evidence linked these new epidemics to changes in weather patterns, including rainfall distribution and quantity (Cristancho et al., <xref ref-type="bibr" rid="B14">2012</xref>).</p>
<p>Multiple Hva races have been reported throughout the world (Rodrigues et al., <xref ref-type="bibr" rid="B57">1975</xref>; Carvalho et al., <xref ref-type="bibr" rid="B8">1987</xref>), and studies from the CIFC (Coffee Rust Research Center) in Portugal have identified over 30 races of the pathogen using a series of more than 40 differential coffee genotypes (Rodrigues et al., <xref ref-type="bibr" rid="B58">1993</xref>). Historically, race II has been predominant in most countries, and it attacks all cultivated varieties of the species <italic>C. arabica</italic> that have not been bred for disease resistance (Rodrigues et al., <xref ref-type="bibr" rid="B57">1975</xref>). In addition to race II, 6 other physiological races have been identified in Colombia using a set of differential plants developed at CIFC (Oeiras, Portugal), attacking some lines of the resistant cultivars (Castillo and Leguizam&#x000F3;n, <xref ref-type="bibr" rid="B11">1992</xref>; Gil and Ocampo, <xref ref-type="bibr" rid="B24">1998</xref>; Alvarado and Moreno, <xref ref-type="bibr" rid="B3">2005</xref>; Rozo et al., <xref ref-type="bibr" rid="B59">2012</xref>). At least 10 more isolates not differentiated by CIFC differential plants, remain to be characterized in Colombia, and several other unknown isolates have also been detected elsewhere (Gouveia et al., <xref ref-type="bibr" rid="B26">2005</xref>).</p>
<p>The emergence of new races and more aggressive isolates in plant pathogens threaten agriculture worldwide as recently observed with the wheat stem rust fungus and the new epidemics of coffee rust, which clearly indicate that further detailed studies and continuous monitoring are needed to improve integrated disease management strategies that mitigate their destructive effect (Aime et al., <xref ref-type="bibr" rid="B1">2006</xref>). Being obligate pathogens, the study of rust fungi biology is particularly challenging and needs substantial investments given the fact that a large set of differential plants have to be employed for the classification of races. The development of novel tools for the identification of isolates is critical to study the biology of these major plant pathogens and genomics might offer such tools. Differential Hva genes expressed in urediniospore, appressoria, and haustoria have already been identified (Fernandez et al., <xref ref-type="bibr" rid="B23">2012</xref>; Talhinhas et al., <xref ref-type="bibr" rid="B73">2014</xref>).</p>
<p>Genomic studies of plant pathogens have provided insights into their evolution, the mechanisms that generate genetic variability and the repertoire of genes that are involved in pathogenesis. These studies have shown that rust fungi exhibit very large genome sizes [<italic>Melampsora lini</italic> &#x0003D; Mli (Nemri et al., <xref ref-type="bibr" rid="B48">2014</xref>) is the largest fungal genome so far] compared to other fungi, containing very large numbers of genes, over 16,000 in most cases, compared to other fungi groups such as Ustilaginomycotina [<italic>U. maydis</italic> &#x0003D; 6786 protein coding genes (Schirawski et al., <xref ref-type="bibr" rid="B63">2010</xref>)] or other non-rust Pucciniomycotina such as <italic>Mixia osmundae</italic> (Toome et al., <xref ref-type="bibr" rid="B76a">2014</xref>). Rusts also show a large content in transposable elements (i.e., nearly 50%, in the genomes analyzed so far, Duplessis et al., <xref ref-type="bibr" rid="B19">2014</xref>). All these features indicate that rust genomes in general are complex to sequence and assemble due to the repetitive content and large genome size.</p>
<p>The discovery of predicted secreted virulence determinants in plant pathogens has also been possible through genomic analysis. Secreted proteins have been linked to the virulence of plant-pathogenic fungi (Spanu, <xref ref-type="bibr" rid="B66">2012</xref>) and many have been predicted in <italic>Melampsora</italic> spp. (Joly et al., <xref ref-type="bibr" rid="B34">2010</xref>; Hacquard et al., <xref ref-type="bibr" rid="B30">2012</xref>), <italic>P. striiformis</italic> (Cantu et al., <xref ref-type="bibr" rid="B6">2011</xref>, <xref ref-type="bibr" rid="B7">2013</xref>), <italic>P. graminis</italic> (Duplessis et al., <xref ref-type="bibr" rid="B20">2011</xref>), and <italic>H. vastatrix</italic> (Fernandez et al., <xref ref-type="bibr" rid="B23">2012</xref>). Thus, the discovery of the secreted protein genes (Saunders et al., <xref ref-type="bibr" rid="B60">2012</xref>) and the functional demonstration of their decisive role in the infection process help in unraveling previously unknown mechanisms of pathogenicity that operate in biotrophic fungi.</p>
<p>We have obtained genome and transcriptome sequences of the coffee rust fungus, and we expect these data to allow the identification of potential molecular markers for the study of rust isolates/races. The knowledge of the Hva genome and particularly of its secretome is a critical point for understanding the mechanisms used by the fungus during the colonization of coffee tissues and allows for comparisons of pathogenesis processes in other rust fungus-plant interactions. The chimeric genome assembly obtained was further used to define polymorphism between isolates and to analyse its basic contents such as the gene complement and TE families. The predicted proteome was additionally supported by a transcriptome analysis of Hva urediniospores. Within the predicted gene complement, a more precise analysis was performed on predicted secreted proteins, likely containing Hva candidate effectors.</p>
</sec>
<sec sec-type="results" id="s2">
<title>Results</title>
<sec>
<title>Nuclear DNA content</title>
<p>The nuclear DNA content of 10 Hva samples was measured by Flow cytometry analysis (Table <xref ref-type="table" rid="T1">1</xref>). Two groups could be distinguished among the 10 samples: one contains four samples that showed a lower content of 1.17&#x02013;1.29 pg of DNA and a second with the six remaining samples showed a higher content of 1.55&#x02013;1.76 pg of DNA per urediniospore (&#x0007E;30% more). Based on these results and compared to the genome size of <italic>P. triticina</italic> used as a control (135 Mb, Puccinia Group Genomes Database, Broad Institute), we estimate the genome size of Hva to be 243&#x02013;324 Mb.</p>
<table-wrap position="float" id="T1">
<label>Table 1</label>
<caption><p><bold>Nuclear DNA content of Hva urediniospore samples measured by FCM</bold>.</p></caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top"><bold><italic>Coffea</italic> species and genotypes</bold></th>
<th align="left" valign="top"><bold>Geographical location</bold></th>
<th align="center" colspan="2" valign="top"><bold>DNA Content (pg)</bold></th>
</tr>
<tr>
<th/>
<th/>
<th align="left" valign="top"><bold>Group 1</bold></th>
<th align="left" valign="top"><bold>Group 2</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top"><italic>C. arabica</italic> var. Caturra</td>
<td align="left" valign="top">La Alcanc&#x000ED;a, Antioquia</td>
<td align="center" valign="top">&#x02013;</td>
<td align="center" valign="top">1.63</td>
</tr>
<tr>
<td align="left" valign="top"><italic>C. arabica</italic> var. Caturra</td>
<td align="left" valign="top">El Cedral, Pereira, Risaralda</td>
<td align="center" valign="top">&#x02013;</td>
<td align="center" valign="top">1.55</td>
</tr>
<tr>
<td align="left" valign="top"><italic>C. arabica</italic> var. Caturra</td>
<td align="left" valign="top">Santa Mar&#x000ED;a, Antioquia</td>
<td align="center" valign="top">1.29</td>
<td align="center" valign="top">&#x02013;</td>
</tr>
<tr>
<td align="left" valign="top"><italic>C. arabica</italic> var. Caturra (Acc. 1421)</td>
<td align="left" valign="top">Chinchin&#x000E1;, Caldas</td>
<td align="center" valign="top">1.17</td>
<td align="center" valign="top">&#x02013;</td>
</tr>
<tr>
<td align="left" valign="top"><italic>C. arabica</italic> BA-13</td>
<td align="left" valign="top">Chinchin&#x000E1;, Caldas</td>
<td align="center" valign="top">&#x02013;</td>
<td align="center" valign="top">1.76</td>
</tr>
<tr>
<td align="left" valign="top"><italic>C. arabica &#x000D7; C. canephora</italic>&#x02013;-Timor Hybrid H-419/2</td>
<td align="left" valign="top">Chinchin&#x000E1;, Caldas</td>
<td align="center" valign="top">&#x02013;</td>
<td align="center" valign="top">1.62</td>
</tr>
<tr>
<td align="left" valign="top"><italic>C. arabica &#x000D7; C. canephora</italic>&#x02013;-Timor Hybrid H-584</td>
<td align="left" valign="top">Chinchin&#x000E1;, Caldas</td>
<td align="center" valign="top">1.21</td>
<td align="center" valign="top">&#x02013;</td>
</tr>
<tr>
<td align="left" valign="top"><italic>C. arabica</italic> var. Tipica</td>
<td align="left" valign="top">Chinchin&#x000E1;, Caldas</td>
<td align="center" valign="top">1.18</td>
<td align="center" valign="top">&#x02013;</td>
</tr>
<tr>
<td align="left" valign="top"><italic>C. arabica</italic> var. Mundo Novo</td>
<td align="left" valign="top">Chinchin&#x000E1;, Caldas</td>
<td align="center" valign="top">&#x02013;</td>
<td align="center" valign="top">1.70</td>
</tr>
<tr>
<td align="left" valign="top"><italic>C. liberica</italic></td>
<td align="left" valign="top">Chinchin&#x000E1;, Caldas</td>
<td align="center" valign="top">&#x02013;</td>
<td align="center" valign="top">1.70</td>
</tr>
<tr>
<td/>
<td align="left" valign="top">Mean</td>
<td align="center" valign="top">1.21</td>
<td align="center" valign="top">1.66</td>
</tr>
<tr>
<td/>
<td align="left" valign="top">Standard deviation</td>
<td align="center" valign="top">0.05</td>
<td align="center" valign="top">0.08</td>
</tr>
<tr>
<td/>
<td align="left" valign="top">CV%</td>
<td align="center" valign="top">5.87</td>
<td align="center" valign="top">6.41</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p><italic>Hva urediniospore samples were stained with Propidium Iodide for Flow Cytometry fluorescence measures following the protocol described by Eilam et al. (<xref ref-type="bibr" rid="B22">1994</xref>)</italic>.</p>
</table-wrap-foot>
</table-wrap>
</sec>
<sec>
<title>Genome assemblies</title>
<p>We sequenced the genomes of the following isolates: HvCat, Hv387, Hv949, HvDQ952, HvH179, HvH569, HvH701, and HvMar; for isolate HvCat, Illumina and 454 sequencing were combined. We obtained a total of 412 million short-reads from Illumina and 5.8 million reads from 454. The fraction of reads that passed quality filtering was over 85% in all Hva Illumina sequenced samples but only 52% for the 454 Hva sequenced sample (Table <xref ref-type="supplementary-material" rid="SM1">S1</xref>, see methods section for filtering parameters). A hybrid 454-Illumina assembly was obtained, combining all genomic Hva sequences with the script clc_novo_assembly from the assembler suite CLC Assembly Cell v4.0.1 (CLC bio, Aarhus, Denmark); we have also performed separate assemblies of the genomes of each isolate. Unfortunately due to inherent characteristics and composition of the genomes (low GC content and richness in TE, detailed in the following sections), we were only able to obtain partial genome assemblies. In order to improve the overall genome assembly, our strategy was to generate an hybrid assembly that takes into account all reads obtained from the 8 isolates together to produce a unique sequence that is a chimera of the sequenced isolates. We were able to define a genome sequence of 333 Mb (129X sequencing depth) composed of 396,264 contigs and 302,466 scaffolds.</p>
<p>We assessed the completeness of the hybrid and individual genomes by running CEGMA with a set of 248 ultra-conserved Core Eukaryotic Genes (CEGs) (Parra et al., <xref ref-type="bibr" rid="B50">2007</xref>) (Table <xref ref-type="table" rid="T2">2</xref>). Statistics for the hybrid assembly are shown in Table <xref ref-type="table" rid="T3">3</xref>; based on the Hva chimeric assembly data, and using Jellyfish (Mar&#x000E7;ais and Kingsford, <xref ref-type="bibr" rid="B42">2011</xref>) to compute the number of distinct k-mers of different lengths and their relationship to coverage, we estimated the size of the Hva genome to be 333 Mb. Considering that the HvaHybrid genome sequence was the only one with a fairly good coverage of conserved core genes, we decided to use it as the reference genome for further analysis.</p>
<table-wrap position="float" id="T2">
<label>Table 2</label>
<caption><p><bold>Statistics gathered from the genome assemblies of Hva individual isolates and the hybrid assembly</bold>.</p></caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th align="left" valign="top"><bold>Sample IDs</bold></th>
<th align="left" valign="top"><bold><italic>Coffea</italic> species and genotypes</bold></th>
<th align="left" valign="top"><bold>Raw reads</bold></th>
<th align="left" valign="top"><bold>Clean reads<xref ref-type="table-fn" rid="TN1"><sup>a</sup></xref></bold></th>
<th align="left" valign="top"><bold>Contigs</bold></th>
<th align="left" valign="top"><bold>Assembly size</bold></th>
<th align="left" valign="top"><bold>Completeness<xref ref-type="table-fn" rid="TN2"><sup>b</sup></xref></bold></th>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">HvHybrid<xref ref-type="table-fn" rid="TN3"><sup>c</sup></xref></td>
<td/>
<td align="left" valign="top">412,417,464</td>
<td align="left" valign="top">359,076,496</td>
<td align="left" valign="top">396,264</td>
<td align="left" valign="top">333,258,024</td>
<td align="left" valign="top">91.94%</td>
</tr>
<tr>
<td align="left" valign="top">HvCat 454<xref ref-type="table-fn" rid="TN4"><sup>d</sup></xref></td>
<td/>
<td align="left" valign="top">5,860,446</td>
<td/>
<td/>
<td/>
<td/>
</tr>
<tr>
<td align="left" valign="top">HvCat Illumina</td>
<td align="left" valign="top"><italic>C. arabica</italic> var. Caturra</td>
<td align="left" valign="top">48,396,016</td>
<td align="left" valign="top">43,704,716</td>
<td align="left" valign="top">254,645</td>
<td align="left" valign="top">122,820,521</td>
<td align="left" valign="top">57.26%</td>
</tr>
<tr>
<td align="left" valign="top">Hv387</td>
<td align="left" valign="top"><italic>C. canephora</italic> CII56</td>
<td align="left" valign="top">58,593,986</td>
<td align="left" valign="top">50,782,526</td>
<td align="left" valign="top">211,495</td>
<td align="left" valign="top">150,707,107</td>
<td align="left" valign="top">44.35%</td>
</tr>
<tr>
<td align="left" valign="top">Hv494</td>
<td align="left" valign="top">H89: <italic>C. arabica</italic> var. Bourbon resistant &#x000D7; <italic>C. arabica</italic> CaRCV3</td>
<td align="left" valign="top">55,326,774</td>
<td align="left" valign="top">47,738,686</td>
<td align="left" valign="top">211,728</td>
<td align="left" valign="top">138,293,025</td>
<td align="left" valign="top">35.08%</td>
</tr>
<tr>
<td align="left" valign="top">HvDQ952</td>
<td align="left" valign="top">F2 &#x02013; <italic>C. arabica</italic> var. Caturra &#x000D7; HdT 1343 (<italic>C. arabica</italic> &#x000D7; <italic>C. canephora</italic>)</td>
<td align="left" valign="top">43,875,056</td>
<td align="left" valign="top">38,844,164</td>
<td align="left" valign="top">197,927</td>
<td align="left" valign="top">121,119,448</td>
<td align="left" valign="top">31.85%</td>
</tr>
<tr>
<td align="left" valign="top">HvH_179</td>
<td align="left" valign="top">H3101: (<italic>C. arabica</italic> CaCV1 &#x000D7; Hdt (<italic>C. arabica</italic> &#x000D7; <italic>C. canephora</italic>) 1343 574CV2) &#x000D7; <italic>C. arabica</italic> CtyR</td>
<td align="left" valign="top">49,025,718</td>
<td align="left" valign="top">42,033,780</td>
<td align="left" valign="top">203,770</td>
<td align="left" valign="top">131,574,289</td>
<td align="left" valign="top">31.05%</td>
</tr>
<tr>
<td align="left" valign="top">HvH_569</td>
<td align="left" valign="top">H3041: (<italic>C. arabica</italic> &#x000D7; HarrarR3) &#x000D7; HdT(<italic>C. arabica</italic> &#x000D7; <italic>C. canephora</italic>) 1343 Africa 1386</td>
<td align="left" valign="top">51,960,392</td>
<td align="left" valign="top">45,000,606</td>
<td align="left" valign="top">202,168</td>
<td align="left" valign="top">133,358,100</td>
<td align="left" valign="top">37.50%</td>
</tr>
<tr>
<td align="left" valign="top">HvH_701</td>
<td align="left" valign="top">H2094: (<italic>C. arabica</italic> MundoNovo) &#x000D7; F502 (<italic>C. arabica</italic> accession from Tanganica)</td>
<td align="left" valign="top">60,634,018</td>
<td align="left" valign="top">53,080,264</td>
<td align="left" valign="top">215,628</td>
<td align="left" valign="top">158,292,515</td>
<td align="left" valign="top">56.86%</td>
</tr>
<tr>
<td align="left" valign="top">HvMar_1</td>
<td align="left" valign="top"><italic>C. arabica</italic> var. Caturra</td>
<td align="left" valign="top">44,605,504</td>
<td align="left" valign="top">39,408,690</td>
<td align="left" valign="top">203,360</td>
<td align="left" valign="top">125,814,765</td>
<td align="left" valign="top">22.18%</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="TN1">
<label>a</label>
<p><italic>Clean reads were obtained after quality trimming and removal of duplicates</italic>.</p>
</fn>
<fn id="TN2">
<label>b</label>
<p><italic>Completeness of the genome was calculated running the software CEGMA with a set of 248 ultra-conserved Core Eukaryotic Genes (CEGs) (Parra et al., <xref ref-type="bibr" rid="B50">2007</xref>)</italic>.</p>
</fn>
<fn id="TN3">
<label>c</label>
<p><italic>The hybrid assembly was generated by the combination of all short reads from the eight isolates</italic>.</p>
</fn>
<fn id="TN4">
<label>d</label>
<p><italic>Eight and a half plates were sequenced with 454 technology</italic>.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<table-wrap position="float" id="T3">
<label>Table 3</label>
<caption><p><bold>Summary of the Hva genome hybrid assembly</bold>.</p></caption>
<table frame="hsides" rules="groups">
<tbody>
<tr>
<td align="left" colspan="2" valign="top">N&#x000B0; Contigs assembled</td>
<td align="left" valign="top">396,264</td>
</tr>
<tr>
<td align="left" colspan="2" valign="top">N&#x000B0; Scaffolds assembled</td>
<td align="left" valign="top">302,466</td>
</tr>
<tr>
<td align="left" colspan="2" valign="top">Total residues assembled</td>
<td align="left" valign="top">333,481,311</td>
</tr>
<tr>
<td align="left" valign="top">Length</td>
<td align="left" valign="top">Max</td>
<td align="left" valign="top">85,126</td>
</tr>
<tr>
<td/>
<td align="left" valign="top">Average</td>
<td align="left" valign="top">841.56</td>
</tr>
<tr>
<td/>
<td align="left" valign="top">N50</td>
<td align="left" valign="top">1,59</td>
</tr>
<tr>
<td align="left" valign="top">Reads</td>
<td align="left" valign="top">Total</td>
<td align="left" valign="top">336,649,188</td>
</tr>
<tr>
<td/>
<td align="left" valign="top">Unassembled</td>
<td align="left" valign="top">197,88,611</td>
</tr>
<tr>
<td/>
<td align="left" valign="top">Assembled</td>
<td align="left" valign="top">316,860,577</td>
</tr>
<tr>
<td/>
<td align="left" valign="top">Multihit</td>
<td align="left" valign="top">37,520,793</td>
</tr>
<tr>
<td/>
<td align="left" valign="top">Potential pairs</td>
<td/>
</tr>
<tr>
<td/>
<td align="left" valign="top">Paired</td>
<td align="left" valign="top">78,105,740</td>
</tr>
<tr>
<td/>
<td align="left" valign="top">Not Paired</td>
<td align="left" valign="top">255,469,308</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p><italic>The 454 and Illumina clean reads were assembled and the same reads were mapped against this set of assembled contigs using the software CLC Assembly Cell v4.0.1</italic>.</p>
</table-wrap-foot>
</table-wrap>
<p>A total of 23.2% of the paired-end reads mapped in the same contig of the HvaHybrid genome assembled. Most unpaired reads (66.8%) matched two different contigs (useful for scaffolding, data not shown). Several contigs displayed coverage greater than 100X, but most of the contigs exhibited low coverage (Figure <xref ref-type="fig" rid="F1">1</xref>); however, over-coverage was pronounced in the short contigs (Figure <xref ref-type="fig" rid="F2">2</xref>). We also illustrated the range of coverage of the contigs and its association to the contigs size (Figure <xref ref-type="fig" rid="F3">3</xref>). The largest contig, Hvcontig_23458 (85 Kbp) showed good coverage. However, the next two contigs in size, Hvcontig_171 (45 kbp) and Hvcontig_161 (71 kbp), showed over-coverage and belong to the Hva mitochondria (see below). Bacterial contamination was very low representing less than 1% of the sequences (Figure <xref ref-type="fig" rid="F4">4</xref>).</p>
<fig id="F1" position="float">
<label>Figure 1</label>
<caption><p><bold>Plot representing the reads coverage per contig in the HvHybrid assembly</bold>. Low read coverage was identified in most contigs.</p></caption>
<graphic xlink:href="fpls-05-00594-g0001.tif"/>
</fig>
<fig id="F2" position="float">
<label>Figure 2</label>
<caption><p><bold>Association between number of reads and size of contigs in the HvHybrid Assembly</bold>. Over-coverage was identified in short contigs.</p></caption>
<graphic xlink:href="fpls-05-00594-g0002.tif"/>
</fig>
<fig id="F3" position="float">
<label>Figure 3</label>
<caption><p><bold>Association between contig size and coverage</bold>. Contigs were clustered by color by running an R script: 0&#x02013;5 low coverage, 5&#x02013;45 good coverage, 45&#x02013;100 high coverage and more than 100 over-coverage.</p></caption>
<graphic xlink:href="fpls-05-00594-g0003.tif"/>
</fig>
<fig id="F4" position="float">
<label>Figure 4</label>
<caption><p><bold>Analysis of sequence contamination in the HvHybrid assembly</bold>. The HvHybrid assembled contigs were searched for contaminants with the program Megan4 (Huson et al., <xref ref-type="bibr" rid="B33">2001</xref>). Each node is labeled by a taxon and the number of reads assigned to the taxon. The size of a node (circle size) is scaled logarithmically to represent the number of assigned reads. A low bacterial and plant sequence contamination was identified in the assembly.</p></caption>
<graphic xlink:href="fpls-05-00594-g0004.tif"/>
</fig>
</sec>
<sec>
<title>Mitochondrial genome annotation</title>
<p>We used the <italic>P. graminis</italic> f.sp. <italic>tritici</italic> (PGT) (Puccinia Group Genomes Database, Broad Institute) mitochondrial genome to find homologs in the <italic>HvHybrid</italic> assembly by BLAST (<italic>e</italic> &#x0003D; 1e-5). BLAST sequence similarities were pictured using the visualizing tool Circoletto (Darzentas, <xref ref-type="bibr" rid="B16">2010</xref>). As shown in Figure <xref ref-type="fig" rid="F5">5</xref>, Hvcontig_161 (71,379 bp, %GC &#x0003D; 33%) and Hvcontig_171 (45,581 bp, %GC &#x0003D; 35%) cover over 70% of the mitochondrial genome of PGT. We also found that 7 contigs of the HvCat assembly entirely covered the mitochondrial genomes of PGT (79,748 bp) and the soybean rust <italic>Phakopsora pachyrhizi</italic> (31,825 bp; Stone et al., <xref ref-type="bibr" rid="B71">2010</xref>) (results not shown). From this analysis we estimate that the Hva mitochondrial genome it is at least of the size of the PGT mitochondrial genome.</p>
<fig id="F5" position="float">
<label>Figure 5</label>
<caption><p><bold>Homology of Hva mitochondrial sequences to the mitochondrial genome of PGT</bold>. Clone_161 and clone_171 sequences from HvHybryd assembly were compared to the mitochondrial genome of <italic>P. graminis</italic> f.sp <italic>tritici</italic> (Supercontig_2.393; 79,2Kb) by running BLAST sequence similarities (<italic>e</italic> &#x0003D; 1e-5). Homologous regions are illustrated with Circoletto (Darzentas, <xref ref-type="bibr" rid="B16">2010</xref>).</p></caption>
<graphic xlink:href="fpls-05-00594-g0005.tif"/>
</fig>
</sec>
<sec>
<title>De novo identification of transposons</title>
<p>The genomes of rust fungi sequenced to date all contain large numbers of transposable elements, which is a major problem for proper assembly (Duplessis et al., <xref ref-type="bibr" rid="B20">2011</xref>; Zheng et al., <xref ref-type="bibr" rid="B79">2013</xref>). A careful annotation of TEs was performed in the chimeric assembly and it showed that the Hva genome also contained a large proportion of repeated sequences. Interspersed repeats were identified in 74.4% of the Hva assembled hybrid contigs using the algorithm RepeatMasker. A similar fraction of repeats was identified in the individual assemblies (71&#x02013;74%). A large proportion of repeats were classified as LTR elements (38.7%), a smaller proportion was classified as DNA elements (7.2%), only 2.1% were classified as LINEs, and 26.3% of repeats were unclassified.</p>
<p>The sequences were annotated for the presence of LTRs, direct repeats and inverted repeats as well as sequence similarities to repeat sequences from Pucciniales. Four novel retrotransposon families were identified in the Hva genome (Table <xref ref-type="supplementary-material" rid="SM1">S2</xref>).</p>
</sec>
<sec>
<title>Predicting protein-coding genes</title>
<p>In order to capture the gene space of the coffee rust genome, we performed a transcriptome analysis of freshly harvested urediniospores based on Illumina RNA-Seq. A total of 44,297&#x02013;64,752 transcripts could be identified in the three RNA-seq based libraries with the program Trinity, with the HvCatNor normalized library holding the smallest number of genes (Table <xref ref-type="supplementary-material" rid="SM1">S3</xref>). We aligned those transcripts onto the chimeric and individual samples assemblies and showed that the normalized library contains the largest fraction of Hva expressed mapped genes (Table <xref ref-type="supplementary-material" rid="SM1">S4</xref>). The normalization approach decreases the prevalence of high abundance transcripts and equalizes transcript concentrations in a cDNA sample, thereby increasing the discovery of low abundance transcripts. The level of contamination of the Hva RNA-seq datasets with plant, bacterial and other contaminant sequences was moderate; the fraction of contamination for each sample was 13.6% for the normalized library HvCatNor, 12,3% for the HvH420_701 library, and 18,9% for the HvCat955 library (Table <xref ref-type="supplementary-material" rid="SM1">S5</xref>). We carried out homology annotation with BLAST against Hva germinating urediniospore transcripts dataset and other rusts predicted proteins datasets (Table <xref ref-type="table" rid="T4">4</xref>). Our Hva urediniospores dataset is as expected very similar to the Hva germinating urediniospores transcripts identified by Talhinhas et al. (<xref ref-type="bibr" rid="B73">2014</xref>).</p>
<table-wrap position="float" id="T4">
<label>Table 4</label>
<caption><p><bold>Homology of Hva transcript datasets to Pucciniales predicted proteins</bold>.</p></caption>
<table frame="hsides" rules="groups">
<thead>
<tr>
<th/>
<th/>
<th align="center" colspan="3" valign="top"><bold>Hva urediniospore transcripts</bold></th>
</tr>
<tr>
<th align="left" valign="top"><bold>Hva samples<xref ref-type="table-fn" rid="TN5"><sup>a</sup></xref></bold></th>
<th align="center" valign="top"><bold>Assmbled transcripts</bold></th>
<th align="left" valign="top"><bold>HvCatNor</bold></th>
<th align="left" valign="top"><bold>HvH420_701</bold></th>
<th align="left" valign="top"><bold>HvCat955</bold></th>
</tr>
<tr>
<td align="left" colspan="5" valign="top"><bold>I</bold></td>
</tr>
</thead>
<tbody>
<tr>
<td align="left" valign="top">Hva (gU)</td>
<td align="center" valign="top">4267</td>
<td align="left" valign="top">91.0% (3884)</td>
<td align="left" valign="top">93.1% (3973)</td>
<td align="left" valign="top">93.9% (4007)</td>
</tr>
<tr>
<td align="left" valign="top"><italic>H. vastatrix</italic> (Ap)</td>
<td align="center" valign="top">3627</td>
<td align="left" valign="top">59.2% (2147)</td>
<td align="left" valign="top">63.1% (2290)</td>
<td align="left" valign="top">63.8% (2315)</td>
</tr>
<tr>
<td align="left" valign="top"><italic>H. vastatrix</italic> (H)</td>
<td align="center" valign="top">4465</td>
<td align="left" valign="top">50.0% (2232)</td>
<td align="left" valign="top">49.1% (2202)</td>
<td align="left" valign="top">49.6% (2229)</td>
</tr>
<tr>
<td align="left" valign="top"><bold>Rust species</bold></td>
<td align="center" valign="top"><bold>Predicted proteins</bold></td>
<td/>
<td/>
<td/>
</tr>
<tr>
<td align="left" colspan="5" valign="top"><bold>II</bold></td>
</tr>
<tr>
<td align="left" valign="top"><italic>Pt</italic></td>
<td align="center" valign="top">11,630</td>
<td align="left" valign="top">42.2% (18,703)</td>
<td align="left" valign="top">40.0% (22,240)</td>
<td align="left" valign="top">36.6% (23,705)</td>
</tr>
<tr>
<td align="left" valign="top"><italic>Pgt</italic></td>
<td align="center" valign="top">15,979</td>
<td align="left" valign="top">43.8% (19,411)</td>
<td align="left" valign="top">41.5% (23,129)</td>
<td align="left" valign="top">37.8% (24,480)</td>
</tr>
<tr>
<td align="left" valign="top"><italic>Pst</italic></td>
<td align="center" valign="top">22,815</td>
<td align="left" valign="top">43.5% (19,257)</td>
<td align="left" valign="top">40.4% (22,544)</td>
<td align="left" valign="top">36.9% (23,874)</td>
</tr>
<tr>
<td align="left" valign="top"><italic>Mlp</italic></td>
<td align="center" valign="top">16,694</td>
<td align="left" valign="top">39.2% (17,385)</td>
<td align="left" valign="top">40.8% (22,765)</td>
<td align="left" valign="top">37.8% (21,302)</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p><italic>I. Homology sequence analysis between Hva transcriptomes datasets (this study) and Hva germinating urediniospores, appresoria, and haustoria transcript sequences (gU, Ap, H, Talhinhas et al., <xref ref-type="bibr" rid="B73">2014</xref>) was performed with the program BLASTn and an E &#x0003D; 1e<sup>&#x02212;20</sup>. II. BLASTx sequence similarity analysis of H. vastatrix RNA-seq sequences and other rust predicted protein datasets (E &#x0003D; 1e<sup>&#x02212;3</sup>). Numbers represent fraction (%) of hits found</italic>.</p>
<fn id="TN5">
<label>a</label>
<p><italic>Hva samples described in Fernandez et al. (<xref ref-type="bibr" rid="B23">2012</xref>)</italic>.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>The predictions of the gene coding space was performed using TopHat (Trapnell et al., <xref ref-type="bibr" rid="B76">2009</xref>) for mapping of RNA-seq data against the HvHybrid genome assembly and proteins were predicted with Augustus (Stanke and Waack, <xref ref-type="bibr" rid="B70">2003</xref>; size filter &#x0003D; 70 amino-acids), using the RNA-Seq data as a guide. We identified a total of 21,345 contigs that matched the RNA-seqs and we predicted a total of 18,234 protein sequences with an average length of 1047 bp for the gene models. We identified 13,796 Hva protein homologs (73.86%) in the Pucciniales order (67,118 sequences) using blastp (<italic>e</italic> &#x0003D; 1e-3).</p>
<p>The total set of sequences was filtered to remove repeats identified in RepBase Release 17.01, and this resulted in a final set containing 14,445 predicted protein-coding gene sequences. Over 96% of this set of gene models was identified in the individual assemblies (Table <xref ref-type="supplementary-material" rid="SM1">S6</xref>). We explored this set of predicted proteins searching for KOGs in the NCBI Conserved Domain Database; 8458 Hva protein-coding genes having a KOG homolog were functionally annotated (Table <xref ref-type="supplementary-material" rid="SM1">S7</xref>). A total of 3921 gene families with 2&#x02013;66 gene members were identified with OrthoMCL (Table <xref ref-type="supplementary-material" rid="SM1">S8</xref>); we also identified 2103 orphan genes.</p>
</sec>
<sec>
<title>Secretome annotation</title>
<p>We predicted 659 secreted proteins using PProwler and 775 secreted proteins with the SignalP algorithm. A total of 180 proteins in our Hva set presented homologs with the secreted proteins already predicted in Hva (Fernandez et al., <xref ref-type="bibr" rid="B23">2012</xref>). A Venn diagram (Figure <xref ref-type="fig" rid="F6">6</xref>) showed shared and unique coincidences between the three sets of data, including 44 proteins extracted by comparison with the dataset predicted by Fernandez et al. (<xref ref-type="bibr" rid="B23">2012</xref>). Most of the secreted proteins predicted are organized in gene families and they were mapped with tblastx to at least one contig from each of the individual assemblies; a final set of 28 predicted proteins was obtained after filtering those belonging to the same gene family and they were functionally annotated with blastp against swissprot, RefSeq, Uniref100 and the non-redundant protein sequences databases (Table <xref ref-type="supplementary-material" rid="SM1">S9</xref>). Only five sequences did not have a homolog sequence with other Pucciniales fungi. Six sequences had a homolog already identified as a secreted protein in <italic>M. larici-populina</italic>. We did not identify in the genome of Hva a homolog of ps87 of <italic>P. striiformis</italic> f.sp. <italic>tritici</italic>, a conserved secreted protein in several fungal plant pathogens (Gu et al., <xref ref-type="bibr" rid="B28">2011</xref>). However, an identical copy of the Hva RTP1 gene (GenBank: FR851895), a transferred protein belonging to the family of effectors in rusts (Pretsch et al., <xref ref-type="bibr" rid="B52">2013</xref>) was identified, suggesting that some effectors are very well conserved between different rust species (Spanu, <xref ref-type="bibr" rid="B66">2012</xref>).</p>
<fig id="F6" position="float">
<label>Figure 6</label>
<caption><p><bold>Venn diagram showing the consensus set of Hva secreted predicted proteins</bold>. PProwler (0.9 probability cut-off) and SignalP were used to predict secreted proteins. A set of 14,445 putative proteins was used for classification into secreted and non-secreted proteins. The results were compared with Hva secreted proteins predicted by Fernandez et al. (<xref ref-type="bibr" rid="B23">2012</xref>). Hva secreted proteins predictions: <bold>(I)</bold> PProwler (this study). <bold>(II)</bold> SignalP (this study). <bold>(III)</bold> Secreted proteins predicted by Fernandez et al. (<xref ref-type="bibr" rid="B23">2012</xref>).</p></caption>
<graphic xlink:href="fpls-05-00594-g0006.tif"/>
</fig>
<p>We identified homologs of the predicted secreted proteins in all but one of the Hva individual assemblies; a homolog of protein KF018005 was not identified in the assembly of HvCat. The secreted proteins mapping to the individual assemblies showed that 6 proteins were identical in every Hva sample. The remaining 22 predicted proteins displayed polymorphism in at least two isolates (Table <xref ref-type="supplementary-material" rid="SM1">S10</xref>).</p>
<p>For Hva proteins KF018008, KF018015, KF018016, KF018020, KF018028 we did not find evidence of predicted homologs in other rusts, representing unique genes of the coffee-rust interaction not represented in other pathosystems. Interestingly, protein KF018020 had no homolog in any database and we could not detect polymorphisms of this protein-coding gene in the Hva individual assemblies, but the Hva genome holds 32 copies of this gene. Protein KF018028, represented by a single copy in the genome, is surprisingly the most diverse of the Hva secreted proteins. It is worth noting that it does not have homologs in any other organism.</p>
</sec>
<sec>
<title>Protein kinases (PKs)</title>
<p>Given the fact that PKs are involved in essential pathways related to development and adaptation to different environments (Miranda and Barton, <xref ref-type="bibr" rid="B46">2007</xref>), we determined differences between PKs families present in pathogen and non-pathogen basidiomycetes. A total of 210 PKs were identified within the set of Hva predicted proteins using HMM3 (Eddy, <xref ref-type="bibr" rid="B21">2011</xref>).</p>
<p>This set of sequences was compared against the predicted PKs of other Pucciniales showing that most protein kinases, including gene families coding for signal transduction pathways, are shared between rust genomes (Table <xref ref-type="supplementary-material" rid="SM1">S11</xref>). We wanted to know the protein kinases exclusively found in pathogenic basidiomycetes and for that we run a BLASTp homology search of PKs of five pathogenic species, <italic>H. vastatrix, P. graminis</italic> f.sp <italic>tritici</italic>, <italic>P. triticina</italic>, <italic>M. larici-populina</italic>, and <italic>U. maydis</italic> against predicted PKs of the non-pathogenic basidiomycetes <italic>Coprinopsis cinerea</italic> (Stajich et al., <xref ref-type="bibr" rid="B68">2010</xref>) and <italic>Laccaria bicolor</italic> (Martin et al., <xref ref-type="bibr" rid="B43">2008</xref>). There are 18 PKs unique to the genomes of plant pathogenic fungi (Table <xref ref-type="supplementary-material" rid="SM1">S12</xref>) and we identified 236 PKs sequences present in <italic>C. cinerea</italic> and <italic>L. bicolor</italic> but not in pathogenic fungi. In the later group we highlight functions TKL/TKL, PKL/ccin9, PKL/CAK/Fmp29, FunK1, AgaK1, atypical/PIKK/TRRAP, and atypical/HisK PKs families because they were not identified in any of the pathogen species although they are expanded in unique families in <italic>C. cinerea</italic> (Stajich et al., <xref ref-type="bibr" rid="B68">2010</xref>) and <italic>L. bicolor</italic> (Martin et al., <xref ref-type="bibr" rid="B43">2008</xref>).</p>
</sec>
</sec>
<sec sec-type="discussion" id="s3">
<title>Discussion</title>
<p>We have generated a de novo hybrid genome assembly of the coffee rust from the sequence of 8 rust samples. We also assembled transcript sequences obtained from normalized and non-normalized RNA-seq libraries representing the urediniospore stage of the fungus. The hybrid genome assembly was the most comprehensive in terms of capturing the largest proportion of the gene space in Hva, therefore offering a picture of a chimeric genome of this species. There appears to be a large extent of repetitive sequences in this chimeric genome, which was evident in our hybrid assembly, as shown by over-covered contigs. For example, two of the three largest contigs showed over-coverage and this event was also found in most contigs shorter than 400 bp. Contamination analysis showed the presence of Bacteria and Viridiplantae sequences in the sequencing reads but the fraction of these sequences was very low. The limitation of having to collect spore samples from plant tissue renders it impossible to have samples free of other organisms; consequently, finding bacterial, plant and other DNA sequences was not unexpected.</p>
<p>We estimated the Hva genome size to be 243&#x02013;324 Mb by FCM and the assembled scaffolds size was close to the larger figure (333 Mb). Differences between the relative amounts of DNA measured by FCM might be due to the presence of a mixture of different cells containing different number of nuclei in the Hva samples tested; Hva urediniospores in coffee leaves carry out meiosis giving rise to spores at different stages of development containing unequal numbers of nuclei in a process referred as cryptosexuality (Carvalho et al., <xref ref-type="bibr" rid="B9">2011</xref>). A similar mechanism of parasexual recombination has been described in <italic>P. triticina</italic> (Wang and McCallum, <xref ref-type="bibr" rid="B77">2009</xref>). The haplophase has not been recognized in Hva and only urediniospores and teliospores representing the dikaryophase have been identified (De Castro et al., <xref ref-type="bibr" rid="B17">2009</xref>).</p>
<p>Our Hva genome size estimates fall remarkably short of recent measurements of 733 Mbp (Carvalho et al., <xref ref-type="bibr" rid="B10">2014</xref>) and 796.8 Mbp (Tavares et al., <xref ref-type="bibr" rid="B74">2014</xref>) obtained by FCM of Hva nuclei isolated from urediniospores. Highly repetitive genomes such as the Hva genome are complex to sequence and analyze and genomes with a high content of repeats are difficult to sequence completely (Sun et al., <xref ref-type="bibr" rid="B72">2003</xref>). Overall, the Hva genome size is larger compared with other fungal genomes, including the Basidiomycetes <italic>M. larici-populina</italic> (101.1 Mb), <italic>P. graminis</italic> f.sp. <italic>tritici</italic> (88.6 Mb) (Duplessis et al., <xref ref-type="bibr" rid="B20">2011</xref>), and <italic>Laccaria bicolor</italic> (68.9 Mb) (Martin et al., <xref ref-type="bibr" rid="B43">2008</xref>), the arbuscular mycorrhizal fungus <italic>Rhizophagus irregularis</italic> (153 Mb) (Tisserant et al., <xref ref-type="bibr" rid="B75">2013</xref>), and the Ascomicota <italic>Tuber melanosporum</italic> (125 Mb) (Martin et al., <xref ref-type="bibr" rid="B44">2010</xref>), and <italic>Blumeria graminis</italic> f.sp. <italic>tritici</italic> (174 Mb) (Parlange et al., <xref ref-type="bibr" rid="B49">2011</xref>).</p>
<p>Our analysis indicated that the Hva mitochondrial genome is at least the size of the <italic>P. graminis</italic> mitochondria. The different genome size estimates obtained so far make imperative the assembly of an Hva genome from a single Hva isolate to clearly elucidate the real nuclear genome size, mitochondrial genome size and fraction of repetitive sequences for this fungus.</p>
<p>We identified a large fraction of repetitive sequences in the hybrid genome; 74.4% of the assembled contigs contain repetitive sequences, with most of them representing transposable elements. Because of the hybrid nature of the assembly, this might be and over-estimate of the real fraction of repetitive sequences present in the genome. However, given the large estimates for the Hva genome size, we expect the genome sequence to contain a large proportion of repeats. A high proportion of transposable elements have also been identified in the genomes of other rusts (Duplessis et al., <xref ref-type="bibr" rid="B20">2011</xref>; Zheng et al., <xref ref-type="bibr" rid="B79">2013</xref>) and the plant pathogen <italic>Blumeria graminis</italic> (Spanu et al., <xref ref-type="bibr" rid="B67">2010</xref>). Genome expansion caused by the replication of TEs has been shown to occur in filamentous fungal and oomycete pathogens of plants, and some expansion of virulence-related genes are associated with their large genome size (Kemen and Jones, <xref ref-type="bibr" rid="B35">2012</xref>). The high diversity of many <italic>Avr</italic>-genes in the rice blast fungus <italic>Magnaporthe grisea</italic> is related to their association with repeated sequences (Huang et al., <xref ref-type="bibr" rid="B32">2014</xref>). On the other hand, the non-pathogen basidiomycetes <italic>L. bicolor</italic> (Martin et al., <xref ref-type="bibr" rid="B43">2008</xref>) and <italic>C. cinerea</italic> (Stajich et al., <xref ref-type="bibr" rid="B68">2010</xref>) harbor a much-reduced proportion of repeated sequences. Whether the genome of Hva has suffered an expansion of virulence-related genes mediated by transposition events should be investigated in further detail. Given the fact that a hybrid genome might contain an over-representation of the fraction of repetitive elements present in single genomes, there is still need to be cautious about the final proportion of repeats in the Hva genome.</p>
<p>The assembly exhibited a high level of fragmentation as shown by the large number of scaffolds obtained in the final assembly and the low N50 value. This fragmentation can be explained by the highly repetitive nature of the Hva genome. It should be possible in the future to improve this assembly by sequencing large insert libraries that will aid in resolving the repetitive nature and to enlarge scaffolds of the Hva assembly (Raffaele and Kamoun, <xref ref-type="bibr" rid="B55">2012</xref>). An additional approach that might be implemented to improve our current hybrid assembly would be to use a &#x0201C;fosmid-to-fosmid&#x0201D; strategy as that followed by Zheng et al. (<xref ref-type="bibr" rid="B79">2013</xref>), who significantly improved an earlier assembly of the <italic>P. striiformis</italic> f.sp. <italic>triticina</italic> genome (Cantu et al., <xref ref-type="bibr" rid="B6">2011</xref>). The GC content of the Hva genome (33%) was lower than <italic>M. larici-populina</italic> (41%), and <italic>P. graminis</italic> f.sp <italic>tritici</italic> (43.3%) (Duplessis et al., <xref ref-type="bibr" rid="B19">2014</xref>). This difference could be explained by GC repetitive sequences collapsing into contigs, therefore yielding a GC content reduction because GC sequences are underrepresented. Though the hybrid Hva genome assembly was highly fragmented, the CEGMA analysis indicated that a significant amount of the genome&#x00027;s gene space was revealed and we consider the current hybrid assembly to be representative of the gene space of a chimeric Hva genome.</p>
<p>Comparative genomics showed considerable similarities between Hva and other rust fungal genomes; over 73% of Hva predicted proteins had homologs among Pucciniales protein datasets. Although rust genomes vary in size, they are very similar in gene content suggesting the presence of a large core set of rust fungus specific genes needed for their pathogenicity. It will also be significant to study the function and specificity of Hva predicted proteins not found in other rusts and study their virulence species-specific adaptations. All in all this set of Hva predicted proteins represent a valuable resource that contributes to the Pucciniales gene repertoire.</p>
<p>In order to capture the gene space of the coffee rust genome, we performed a transcriptome analysis of freshly harvested urediniospores based on Illumina RNA-Seq. The number of secreted proteins predicted in this study is smaller than the number found in <italic>M. larici-populina</italic> (1184 SSPs) and <italic>P. graminis</italic> f.sp. <italic>tritici</italic> (1106 SSPs) genomes (Duplessis et al., <xref ref-type="bibr" rid="B20">2011</xref>), perhaps reflecting the Hva partial genome assembled. Also, it has to be considered that <italic>M. larici-populina</italic> and <italic>P. graminis</italic> f.sp. <italic>tritici</italic> SSPs were predicted with the SignalP, TargetP, and TMHMM algorithms while we did not include TMHMM in our predictions. The non-inclusion of TMHMM transmembrane protein predictions in some way renders our current set of secreted proteins incomplete. On the whole, this set of Hva predicted secreted-proteins is a basic tool for the identification of pathogenicity-related genes as shown for other rusts (Joly et al., <xref ref-type="bibr" rid="B34">2010</xref>; Cantu et al., <xref ref-type="bibr" rid="B6">2011</xref>). It is possible that avirulence elicitors be present among the set of predicted secreted proteins, as it has been found in flax rust (Catanzariti et al., <xref ref-type="bibr" rid="B12">2006</xref>). For Hva proteins KF018008, KF018015, KF018016, KF018020, KF018028 we did not find evidence of predicted homologs in other rusts, representing unique genes of the coffee-rust interaction not represented in other pathosystems; secreted proteins have been found to be lineage-specific in other rusts as well (Duplessis et al., <xref ref-type="bibr" rid="B20">2011</xref>). Overall analysis of the Hva predicted secretome shows that secreted proteins are well conserved among plant rusts and that they include functions most likely involved in the pathogenesis of the fungus. Therefore, this group of annotated secreted proteins suits well as prime candidates for functional testing.</p>
<p>The Hva genome contains most of the gene families coding for signal transduction pathways identified in the genomes of other rust fungi. It is assumed that these gene families are involved in signal perception mechanisms of rust urediniospores (Duplessis et al., <xref ref-type="bibr" rid="B20">2011</xref>) and gives them a highly specialized mechanism for the detection of stomata (Kemen and Jones, <xref ref-type="bibr" rid="B35">2012</xref>). We have grouped the candidate PKs with signal perception roles related to pathogenesis in 18 gene families, those identified in pathogen basidiomycetes but absent in non-pathogenic species.</p>
<p>Illumina and 454 sequencing was used to generate a draft genome in different Hva isolates. Due to the complexity of the genome sequence&#x02014;similar to other rust fungi- a minimal draft chimeric genome was defined by considering the genome of the different isolates altogether. The genome sequence is a novel resource in Pucciniales, a group that includes many species that are economically major diseases of several crops. It provides data to study the evolution of this important group of plant pathogens. The draft genome sequence of Hva will serve as a template for future assemblies of isolates of this fungus and to understand the molecular mechanisms used by this pathogen to attack the coffee plant and to study its diversity. It will also be the basis for the development of molecular markers to distinguish races/isolates given the enormous difficulties of trying to identify coffee rust races by the use of differential plants. The genomic data of the coffee leaf rust presented here are a reference to track changes in field populations, to characterize the decline in sensitivity against widely used fungicides such as triazoles and strobilurins that are used in coffee rust disease management, and to preserve genotype identity in fungal collections. The increased use of coffee rust-resistant varieties will increase the selective pressure to favor complex fungal genotypes, and resources such as the secretome set is the cornerstone for the development of innovative resistance mechanisms to control this pathogen.</p>
</sec>
<sec sec-type="materials and methods" id="s4">
<title>Materials and methods</title>
<sec>
<title>Nuclear DNA content estimated by FCM</title>
<p>Flow cytometry (FCM) was used to estimate nuclear DNA content in urediniospores of <italic>H. vastatrix</italic>, following the protocol described by Eilam et al. (<xref ref-type="bibr" rid="B22">1994</xref>), modified for the uredinial stage. Urediniospores were suspended in 0.1% Tween 20 in water for 20 min. The suspension was incubated for 2 min. in a 1000-watt microwave on 50% power level, adding Propidium Iodide and RNase to final concentrations of 4 &#x003BC;g/ml and 50 &#x003BC;g/ml respectively, and incubated for 1 h at 37&#x000B0;C. The urediniospores samples were run on a Bacton Dickinson FACS IV flow cytometer. Urediniospores of <italic>P. triticina</italic> were used as a control. Data from the flow cytometer were analyzed using the Flowing Software v2.5 at the Centre for Biotechnology University of Turku, Finland. Urediniospores of Hva and <italic>P. triticina</italic> were stained and analyzed simultaneously, with the standard control positioned on channel 200. The <italic>C</italic>-Value (pg) was converted to base pairs (bp), considering that 1pg &#x0003D; 978 Mb (Dolezel et al., <xref ref-type="bibr" rid="B18">2003</xref>). <italic>H. vastatrix</italic> samples used for FCM are described in Table <xref ref-type="table" rid="T1">1</xref>.</p>
</sec>
<sec>
<title>Genome and transcriptome sequencing and assembly</title>
<p>Hva urediniospore samples were scraped from infected coffee leaves taking care to sample very young pustules with no evidence of the presence of the hyperparasitic fungus <italic>Lecanicillium lecanii</italic>. The coffee genotypes sampled for Hva and the sequencing technologies used are described in Table <xref ref-type="table" rid="T2">2</xref>. DNA was extracted using the DNeasy Plant Mini-Kit (Qiagen, Hilden, Germany); <italic>H. vastatrix</italic> DNA samples were used to construct 100 bp paired-end libraries and sequenced by Illumina&#x02122; HiSeq 2000 at BGI in China. Single-end libraries were sequenced by ROCHE&#x02122; 454 GS FLX Titanium method at Macrogen in Korea.</p>
<p>Reads were subjected to quality control checks using FastQC (Babraham Bioinformatics, Babraham Institute), trimmed using the CLC quality_trim script (CLC bio, Aarhus, Denmark), masked or filtered by low complexity end regions, and exclusion of reads shorter than 70 nucleotides. Mdust and SeqClean were used for the cleaning process (The Gene Index Project, Harvard University&#x02014;<ext-link ext-link-type="uri" xlink:href="http://sourceforge.net/projects/seqclean/files/">http://sourceforge.net/projects/seqclean/files/</ext-link>). Trimmed and filtered reads were assembled with the CLC Assembly Cell v4.0.1 (CLC bio, Aarhus, Denmark) with the following parameters: deletions penalty &#x0003D; 3, no global alignment, remove duplicates, min contig length &#x0003D; 200 bp, paired-end distance &#x0003D; 200&#x02013;400 bp. The quality of the assembly was assessed with CLC tools (clc_assembly_viewer, assembly_info) and in-house R scripts available at (<ext-link ext-link-type="uri" xlink:href="http://bioinformatics.cenicafe.org/index.php/wiki/Third_Hybrid_Assembly_of_454_and_Illumina_data_with_CLC">http://bioinformatics.cenicafe.org/index.php/wiki/Third_Hybrid_Assembly_of_454_and_Illumina_data_with_CLC</ext-link>).</p>
<p>The hybrid assembly was analyzed using MEGAN 4 (Huson et al., <xref ref-type="bibr" rid="B33">2001</xref>) to assess the level of possible contamination and to perform a first approximation of the biological communities associated with Hva on the coffee leaf. Blastx was performed using the contigs from the hybrid assembly (Illumina &#x0002B; 454 short reads) (396,264 contigs) against the NCBI non-redundant protein database. An <italic>E</italic>-value of 10e<sup>&#x02212;3</sup> was used as a cut-off following the recommendation from the MEGAN developers. MEGAN was used to map and visualize the Low Common Ancestor (LCA) in the NCBI tree taxonomy for each contig. With the aim of filtering out putative contaminated sequences, contigs that presented similarities to reported fungal sequences were extracted to form a reliable set of Hva genome contigs. The reliable set of <italic>H. vastatrix</italic> genome contigs was compared against the <italic>P</italic>. <italic>graminis</italic> f.sp. <italic>tritici</italic> and <italic>P. pachyrhizi</italic> mitochondrial genomes using Blastn (with an <italic>E</italic>-value threshold of 1E<sup>&#x02212;5</sup>).</p>
<p>For RNA-seq sample preparation, Hva urediniospores were scraped from infected coffee leaves of the coffee genotypes described in Table <xref ref-type="supplementary-material" rid="SM1">S3</xref>, taking care to sample very young pustules with no evidence of the presence of the hyperparasitic fungus <italic>Lecanicillium lecanii</italic>. RNA was extracted from urediniospores using the RNeasy Plant Mini Kit (Qiagen, Valencia, CA, USA). Normalized library construction was performed at Evrogen, Moscow, Russia using Kamchatka crab duplex-specific nuclease (Zhulidov et al., <xref ref-type="bibr" rid="B80">2004</xref>). First-strand cDNA was prepared from poly(A)&#x0002B; <italic>H. vastatrix</italic> urediniospores RNA using a SMART&#x02122; PCR cDNA Synthesis Kit (Clontech), according to the manufacturer&#x00027;s protocol. SMART&#x02122; Oligo II and CDS primers (Clontech) were used for first-strand cDNA synthesis. A 1.5 ml aliquot of a 100 ng/ml of the first-strand cDNA solution was incubated for normalization with 0.25 Kunitz units of duplex-specific nuclease from kamchatka crab and amplified by PCR. Sequencing of amplified cDNA products was performed on an Illumina&#x02122; HiSeq 2000 system (BGI, Shenzhen, 518083, China).</p>
<p>RNA-seq data were filtered before assembly. The quality of the transcripts was measured using the FASTX-Toolkit, reads were trimmed by quality and duplicates were removed. Clean reads longer than 200bp were assembled using the Trinity package (Grabherr et al., <xref ref-type="bibr" rid="B27">2011</xref>). First, the reads were run through Trinity&#x00027;s Inchworm module, which assembles the read data set into different pools of reads, and the Chrysalis module was used to construct de Brujin graphs for all the read pools obtained using Inchworm. We used the module Butterfly that reconciles de Brujin graphs using the read pools from the former modules and output assembled contigs. We mapped Hva transcript datasets to the HvHybrid 454-Illumina assembly and we also compared transcripts against the NR database to identify plant, bacterial and other contaminant sequences.</p>
</sec>
<sec>
<title>Transposable elements prediction</title>
<p>We surveyed the frequency and classes of TE-like elements present in the HvHybrid assembly using the algorithm RepeatMasker (Smit et al., <xref ref-type="bibr" rid="B65">1996-2004</xref>) and the RepBase12.12 and fngrep.ref databases. The fngrep.ref database included 1726 transposable elements identified in fungi. Novel retrotransposon families were manually annotated from the gene families identified with OrthoMCL (see below).</p>
</sec>
<sec>
<title>Gene prediction</title>
<p>For the prediction of gene models, we followed the &#x0201C;align then assemble&#x0201D; approach (Martin and Wang, <xref ref-type="bibr" rid="B45">2011</xref>). We mapped RNA-seq short reads to the genome using TopHat (Trapnell et al., <xref ref-type="bibr" rid="B76">2009</xref>), and we identified putative transcriptional units using Augustus (Stanke and Waack, <xref ref-type="bibr" rid="B70">2003</xref>). Protein sequences were computationally deduced from the transcriptional units. Gene families from predicted proteins larger than 70 amino acids were identified with OrthoMCL using a default MCL inflation value of 1.5 and a blastp <italic>e</italic>-value of 10e<sup>&#x02212;5</sup> (Li et al., <xref ref-type="bibr" rid="B40">2003</xref>). We explored the set of predicted proteins, searching for KOGs using the CD-Search Tool and the Conserved Domain Database (<ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/Structure/cdd/cdd.shtml">www.ncbi.nlm.nih.gov/Structure/cdd/cdd.shtml</ext-link>).</p>
</sec>
<sec>
<title>Comparative genomics</title>
<p>The Hva genome contigs were aligned against the genomes of <italic>P. graminis</italic>, <italic>M. larici</italic>-<italic>populina</italic> and <italic>U. maydis</italic> using Mauve (Darling et al., <xref ref-type="bibr" rid="B15">2004</xref>). The Low Collinear Block (LCB) values were set through visual inspection by searching the best block size for each pair of alignments (largest coverage of both genomes). Finally, values used for LCB were as follows: <italic>P. graminis</italic> 12,154, <italic>M. larici</italic>-<italic>populina</italic> 10,409, and <italic>U. maydis</italic> 1203.</p>
<p>For genome annotation, we used custom Perl scripts and basic bioinformatics software such as BLAST (Altschul et al., <xref ref-type="bibr" rid="B2">1990</xref>). The databases we used for comparisons corresponded to 67,118 Pucciniales sequences comprising 16,694 protein-coding genes from <italic>M. larici-populina</italic> (Duplessis et al., <xref ref-type="bibr" rid="B20">2011</xref>), 22,815 <italic>P. striiformis</italic> f.sp. <italic>tritici</italic> sequences (Cantu et al., <xref ref-type="bibr" rid="B6">2011</xref>), 15,979 <italic>P. graminis</italic> f.sp. <italic>tritici</italic> sequences (Duplessis et al., <xref ref-type="bibr" rid="B20">2011</xref>), and 11,630 <italic>P. triticina</italic> sequences (Xu et al., <xref ref-type="bibr" rid="B78">2011</xref>).</p>
<p>For homology searches of protein kinases (PKs) we run BLASTp (version 2.2.28) with an <italic>e</italic> &#x0003D; 1e<sup>&#x02212;10</sup>. We searched <italic>H. vastatrix</italic> predicted proteins against 131 predicted PKs from <italic>Sacharomyces cerevisiae</italic> and then we compared the coffee rust PKs against <italic>M. laricis-populina</italic>, <italic>P. striiformis</italic> f.sp <italic>tritici</italic>, <italic>P. graminis</italic> f.sp <italic>tritici</italic>, <italic>P. triticina</italic>, and <italic>U. maydis</italic> predicted PKs.</p>
</sec>
<sec>
<title>Secreted proteins</title>
<p>The <italic>H. vastatrix</italic> predicted proteins were classified into secreted and non-secreted proteins. For this task, the programs SignalP 4.0 (Petersen et al., <xref ref-type="bibr" rid="B51">2011</xref>) and PProwler (Hawkins and Boden, <xref ref-type="bibr" rid="B31">2006</xref>) were used to predict putatively secreted proteins. A 0.9 probability cut-off was used for PProwler predictions. A set of secreted proteins predicted previously for <italic>H. vastatrix</italic> by Fernandez et al. (<xref ref-type="bibr" rid="B23">2012</xref>) was used for comparison with our predictions. Briefly, a Blastp was performed between our set of <italic>H. vastatrix</italic> proteins and the predictions by Fernandez et al. (<xref ref-type="bibr" rid="B23">2012</xref>). Finally, a set of proteins that showed similarity (Blastp <italic>e</italic> &#x0003D; 1e<sup>&#x02212;5</sup>) with the secreted proteins predicted by Fernandez et al. (<xref ref-type="bibr" rid="B23">2012</xref>) was obtained. Reciprocal comparisons of the three sets of secreted proteins were performed (SignalP, PProwler and Fernandez-Blastp) to establish the proteins shared by the three predictions.</p>
</sec>
</sec>
<sec>
<title>Availability</title>
<p>Raw data and metadata for the Genome project is available at NCBI, BioProject ID: PRJNA188788 and the Transcriptome project ID: PRJEB2960. Predicted and secreted proteins are available at <ext-link ext-link-type="uri" xlink:href="http://bioinformatics.cenicafe.org/index.php/wiki/CoffeeRustPredictedProteins">http://bioinformatics.cenicafe.org/index.php/wiki/CoffeeRustPredictedProteins</ext-link>.</p>
<p>The hybrid reference assembled genome contigs are available for download at: <ext-link ext-link-type="uri" xlink:href="http://bioinformatics.cenicafe.org/index.php/wiki/CoffeeRustHybridDraftAssembly_Contigs">http://bioinformatics.cenicafe.org/index.php/wiki/CoffeeRustHybridDraftAssembly_Contigs</ext-link>.</p>
<sec>
<title>Conflict of interest statement</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p></sec>
</sec>
</body>
<back>
<ack>
<p>The authors wish to thank the National Federation of Coffee Growers of Colombia, the Ministry of Agriculture and Rural Development and the Colombian Administrative Department of Science, Technology and Innovation&#x02014;Colciencias for financial support. Authors would also like to thank Perttu Terho from the Centre for Biotechnology, University of Turku, Finland for data analysis from the flow cytometer experiment. Diego Mauricio Ria&#x000F1;o-Pach&#x000F3;n acknowledges funding provided by the Faculty of Sciences at Universidad de los Andes through the Assistant Professor Support Program.</p>
</ack>
<sec sec-type="supplementary-material" id="s5">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="http://www.frontiersin.org/journal/10.3389/fpls.2014.00594/abstract">http://www.frontiersin.org/journal/10.3389/fpls.2014.00594/abstract</ext-link></p>
<supplementary-material xlink:href="DataSheet1.XLSX" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Aime</surname> <given-names>C.</given-names></name> <name><surname>Matheny</surname> <given-names>P. B.</given-names></name> <name><surname>Henk</surname> <given-names>D. A.</given-names></name> <name><surname>Frieders</surname> <given-names>E. M.</given-names></name> <name><surname>Nilsson</surname> <given-names>R. H.</given-names></name> <name><surname>Piepenbring</surname> <given-names>M.</given-names></name> <etal/></person-group>. (<year>2006</year>). <article-title>An overview of the higher-level classification of Pucciniomycotina based on combined analyses of nuclear large and small subunit rDNA sequences</article-title>. <source>Mycologia</source> <volume>98</volume>, <fpage>896</fpage>&#x02013;<lpage>905</lpage>. <pub-id pub-id-type="doi">10.3852/mycologia.98.6.896</pub-id><pub-id pub-id-type="pmid">17486966</pub-id></citation>
</ref>
<ref id="B2">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Altschul</surname> <given-names>S. F.</given-names></name> <name><surname>Gish</surname> <given-names>W.</given-names></name> <name><surname>Miller</surname> <given-names>W.</given-names></name> <name><surname>Myers</surname> <given-names>E. W.</given-names></name> <name><surname>Lipman</surname> <given-names>D. J.</given-names></name></person-group> (<year>1990</year>). <article-title>Basic local alignment search tool</article-title>. <source>J. Mol. Biol</source>. <volume>215</volume>, <fpage>403</fpage>&#x02013;<lpage>410</lpage>. <pub-id pub-id-type="pmid">2231712</pub-id></citation>
</ref>
<ref id="B3">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Alvarado</surname> <given-names>G.</given-names></name> <name><surname>Moreno</surname> <given-names>G.</given-names></name></person-group> (<year>2005</year>). <article-title>Cambio de la virulencia de <italic>Hemileia vastatrix</italic> en progenies de Caturra x H&#x000ED;brido de Timor</article-title>. <source>Cenicafe</source> <volume>56</volume>, <fpage>110</fpage>&#x02013;<lpage>126</lpage>.</citation>
</ref>
<ref id="B6">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cantu</surname> <given-names>D.</given-names></name> <name><surname>Govindarajulu</surname> <given-names>M.</given-names></name> <name><surname>Kozik</surname> <given-names>A.</given-names></name> <name><surname>Wang</surname> <given-names>M.</given-names></name> <name><surname>Chen</surname> <given-names>X.</given-names></name> <name><surname>Kojima</surname> <given-names>K.</given-names></name> <etal/></person-group>. (<year>2011</year>). <article-title>Next generation sequencing provides rapid access to the genome of <italic>Puccinia striiformis</italic> f.sp. <italic>tritici</italic>, the causal agent of wheat stripe rust</article-title>. <source>PLoS ONE</source> <volume>6</volume>:<fpage>e24230</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0024230</pub-id><pub-id pub-id-type="pmid">21909385</pub-id></citation>
</ref>
<ref id="B7">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cantu</surname> <given-names>D.</given-names></name> <name><surname>Segovia</surname> <given-names>V.</given-names></name> <name><surname>MacLean</surname> <given-names>D.</given-names></name> <name><surname>Bayles</surname> <given-names>R.</given-names></name> <name><surname>Chen</surname> <given-names>X.</given-names></name> <name><surname>Kamoun</surname> <given-names>S.</given-names></name> <etal/></person-group>. (<year>2013</year>). <article-title>Genome analyses of the wheat yellow (stripe) rust pathogen <italic>Puccinia striiformis</italic> f.sp. <italic>tritici</italic> reveal polymorphic and haustorial expressed secreted proteins as candidate effectors</article-title>. <source>BMC Genomics</source> <volume>14</volume>:<fpage>270</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2164-14-270</pub-id><pub-id pub-id-type="pmid">23607900</pub-id></citation>
</ref>
<ref id="B8">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Carvalho</surname> <given-names>A.</given-names></name> <name><surname>Eskes</surname> <given-names>A. B.</given-names></name> <name><surname>Castillo</surname> <given-names>J.</given-names></name> <name><surname>Sreenivasan</surname> <given-names>M.</given-names></name> <name><surname>Echeverri</surname> <given-names>J.</given-names></name> <name><surname>Fernandez</surname> <given-names>C.</given-names></name> <etal/></person-group>. (<year>1987</year>). <article-title>Breeding programs</article-title>, in <source>Coffee Rust: Epidemiology, Resistance, and Management</source>, eds <person-group person-group-type="editor"><name><surname>Kushalappa</surname> <given-names>A. C.</given-names></name> <name><surname>Eskes</surname> <given-names>A. B.</given-names></name></person-group> (<publisher-loc>Boca Raton, FL</publisher-loc>: <publisher-name>CRC Press</publisher-name>), <fpage>293</fpage>&#x02013;<lpage>336</lpage></citation>
</ref>
<ref id="B9">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Carvalho</surname> <given-names>C. R.</given-names></name> <name><surname>Fernandes</surname> <given-names>R. C.</given-names></name> <name><surname>Carvalho</surname> <given-names>G. M. A.</given-names></name> <name><surname>Barreto</surname> <given-names>R. W.</given-names></name> <name><surname>Evans</surname> <given-names>H. C.</given-names></name></person-group> (<year>2011</year>). <article-title>Cryptosexuality and the genetic diversity paradox in coffee rust, <italic>Hemileia vastatrix</italic></article-title>. <source>PLoS ONE</source> <volume>6</volume>:<fpage>e26387</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0026387</pub-id><pub-id pub-id-type="pmid">22102860</pub-id></citation>
</ref>
<ref id="B10">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Carvalho</surname> <given-names>G. M. A.</given-names></name> <name><surname>Carvalho</surname> <given-names>C. R.</given-names></name> <name><surname>Barreto</surname> <given-names>R. W.</given-names></name> <name><surname>Evans</surname> <given-names>H. C.</given-names></name></person-group> (<year>2014</year>). <article-title>Coffee rust genome measured using flow cytometry: does size matter?</article-title> <source>Plant Pathol</source>. <volume>63</volume>, <fpage>1022</fpage>&#x02013;<lpage>1026</lpage>. <pub-id pub-id-type="doi">10.1111/ppa.12175</pub-id></citation>
</ref>
<ref id="B11">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Castillo</surname> <given-names>J.</given-names></name> <name><surname>Leguizam&#x000F3;n</surname> <given-names>J.</given-names></name></person-group> (<year>1992</year>). <article-title>Virulencia de <italic>Hemileia vastatrix</italic> determinada por medio de plantas diferenciales de caf&#x000E9; en Colombia</article-title>. <source>Cenicafe</source> <volume>43</volume>, <fpage>114</fpage>&#x02013;<lpage>124</lpage></citation>
</ref>
<ref id="B12">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Catanzariti</surname> <given-names>A. M.</given-names></name> <name><surname>Dodds</surname> <given-names>P. N.</given-names></name> <name><surname>Lawrence</surname> <given-names>G. J.</given-names></name> <name><surname>Ayliffe</surname> <given-names>M. A.</given-names></name> <name><surname>Ellis</surname> <given-names>J. G.</given-names></name></person-group> (<year>2006</year>). <article-title>Haustorially expressed secreted proteins from flax rust are highly enriched for avirulence elicitors</article-title>. <source>Plant Cell</source> <volume>18</volume>, <fpage>243</fpage>&#x02013;<lpage>256</lpage>. <pub-id pub-id-type="doi">10.1105/tpc.105.035980</pub-id><pub-id pub-id-type="pmid">16326930</pub-id></citation>
</ref>
<ref id="B13">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cressey</surname> <given-names>D.</given-names></name></person-group> (<year>2013</year>). <article-title>Coffee rust regains foothold</article-title>. <source>Nature</source> <volume>493</volume>, <fpage>587</fpage>. <pub-id pub-id-type="doi">10.1038/493587a</pub-id><pub-id pub-id-type="pmid">23364717</pub-id></citation>
</ref>
<ref id="B14">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cristancho</surname> <given-names>M. A.</given-names></name> <name><surname>Rozo</surname> <given-names>Y.</given-names></name> <name><surname>Escobar</surname> <given-names>Y.</given-names></name> <name><surname>Rivillas</surname> <given-names>C. A.</given-names></name> <name><surname>Gait&#x000E1;n</surname> <given-names>A. L.</given-names></name></person-group> (<year>2012</year>). <article-title>Outbreak of coffee leaf rust (<italic>Hemileia vastatrix</italic>) in Colombia</article-title>. <source>New Dis. Rep</source>. <volume>25</volume>, <fpage>2044</fpage>&#x02013;<lpage>0588</lpage>. <pub-id pub-id-type="doi">10.5197/j.2044-0588.2012.025.019</pub-id></citation>
</ref>
<ref id="B15">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Darling</surname> <given-names>A. C. E.</given-names></name> <name><surname>Mau</surname> <given-names>B.</given-names></name> <name><surname>Blattner</surname> <given-names>F. R.</given-names></name> <name><surname>Perna</surname> <given-names>N. T.</given-names></name></person-group> (<year>2004</year>). <article-title>Mauve: multiple alignment of conserved genomic sequence with rearrangements</article-title>. <source>Genome Res</source>. <volume>14</volume>, <fpage>1394</fpage>&#x02013;<lpage>1397</lpage>. <pub-id pub-id-type="doi">10.1101/gr.2289704</pub-id><pub-id pub-id-type="pmid">15231754</pub-id></citation>
</ref>
<ref id="B16">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Darzentas</surname> <given-names>N.</given-names></name></person-group> (<year>2010</year>). <article-title>Circoletto: visualizing sequence similarity with Circos</article-title>. <source>Bioinformatics</source> <volume>26</volume>, <fpage>2620</fpage>&#x02013;<lpage>2621</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btq484</pub-id><pub-id pub-id-type="pmid">20736339</pub-id></citation>
</ref>
<ref id="B17">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>De Castro</surname> <given-names>R.</given-names></name> <name><surname>Evans</surname> <given-names>H. C.</given-names></name> <name><surname>Barreto</surname> <given-names>R. W.</given-names></name></person-group> (<year>2009</year>). <article-title>Confirmation of the occurrence of teliospores of <italic>Hemileia vastatrix</italic> in Brazil with observations on their mode of germination</article-title>. <source>Trop. Plant Pathol</source>. <volume>34</volume>, <fpage>108</fpage>&#x02013;<lpage>113</lpage>. <pub-id pub-id-type="doi">10.1590/S1982-56762009000200005</pub-id></citation>
</ref>
<ref id="B18">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dolezel</surname> <given-names>J.</given-names></name> <name><surname>Bartos</surname> <given-names>J.</given-names></name> <name><surname>Voglmayr</surname> <given-names>H.</given-names></name> <name><surname>Greilhuber</surname> <given-names>J.</given-names></name></person-group> (<year>2003</year>). <article-title>Nuclear DNA content and genome size of trout and human</article-title>. <source>Cytometry A</source> <volume>51</volume>, <fpage>127</fpage>&#x02013;<lpage>128</lpage>. <pub-id pub-id-type="doi">10.1002/cyto.a.10013</pub-id><pub-id pub-id-type="pmid">12541287</pub-id></citation>
</ref>
<ref id="B19">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Duplessis</surname> <given-names>S.</given-names></name> <name><surname>Bakkeren</surname> <given-names>G.</given-names></name> <name><surname>Hamelin</surname> <given-names>R.</given-names></name></person-group> (<year>2014</year>). <article-title>Advancing knowledge on biology of rust fungi through genomics</article-title>. <source>Adv. Bot. Res</source>. <volume>70</volume>, <fpage>173</fpage>&#x02013;<lpage>209</lpage>. <pub-id pub-id-type="doi">10.1016/B978-0-12-397940-7.00006-9</pub-id></citation>
</ref>
<ref id="B20">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Duplessis</surname> <given-names>S.</given-names></name> <name><surname>Cuomo</surname> <given-names>C. A.</given-names></name> <name><surname>Lin</surname> <given-names>Y. C.</given-names></name> <name><surname>Aerts</surname> <given-names>A.</given-names></name> <name><surname>Tisserant</surname> <given-names>E.</given-names></name> <name><surname>Veneault-Fourrey</surname> <given-names>C.</given-names></name> <etal/></person-group>. (<year>2011</year>). <article-title>Obligate biotrophy features unraveled by the genomic analysis of rust fungi</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A</source>. <volume>108</volume>, <fpage>9166</fpage>&#x02013;<lpage>9171</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1019315108</pub-id><pub-id pub-id-type="pmid">21536894</pub-id></citation>
</ref>
<ref id="B21">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Eddy</surname> <given-names>S. R.</given-names></name></person-group> (<year>2011</year>). <article-title>Accelerated profile HMM searches</article-title>. <source>PLoS Comp. Biol</source>. <volume>7</volume>:<fpage>e1002195</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pcbi.1002195</pub-id><pub-id pub-id-type="pmid">22039361</pub-id></citation>
</ref>
<ref id="B22">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Eilam</surname> <given-names>T.</given-names></name> <name><surname>Bushnell</surname> <given-names>W. R.</given-names></name> <name><surname>Anikster</surname> <given-names>Y.</given-names></name></person-group> (<year>1994</year>). <article-title>Relative nuclear DNA content of rust fungi estimated by flow cytometry of Propydium iodide-stained pycniospores</article-title>. <source>Phytopathology</source> <volume>84</volume>, <fpage>728</fpage>&#x02013;<lpage>735</lpage>. <pub-id pub-id-type="doi">10.1094/Phyto-82-1212</pub-id></citation>
</ref>
<ref id="B23">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Fernandez</surname> <given-names>D.</given-names></name> <name><surname>Tisserant</surname> <given-names>E.</given-names></name> <name><surname>Talhinhas</surname> <given-names>P.</given-names></name> <name><surname>Azinheira</surname> <given-names>H.</given-names></name> <name><surname>Vieira</surname> <given-names>A.</given-names></name> <name><surname>Petitot</surname> <given-names>A. S.</given-names></name> <etal/></person-group>. (<year>2012</year>). <article-title>454-pyrosequencing of <italic>Coffea arabica</italic> leaves infected by the rust fungus <italic>Hemileia vastatrix</italic> reveals in planta-expressed pathogen-secreted proteins and plant functions in a late compatible plant&#x02013;rust interaction</article-title>. <source>Mol. Plant Pathol</source>. <volume>13</volume>, <fpage>17</fpage>&#x02013;<lpage>37</lpage>. <pub-id pub-id-type="doi">10.1111/j.1364-3703.2011.00723.x</pub-id><pub-id pub-id-type="pmid">21726390</pub-id></citation>
</ref>
<ref id="B24">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gil</surname> <given-names>L. F.</given-names></name> <name><surname>Ocampo</surname> <given-names>J. D.</given-names></name></person-group> (<year>1998</year>). <article-title>Identificaci&#x000F3;n de la raza XXII (V5-6) de <italic>Hemileia vastatrix</italic> Berk. y Br. en Colombia</article-title>. <source>Cenicaf&#x000E9;</source> <volume>49</volume>, <fpage>340</fpage>&#x02013;<lpage>344</lpage></citation>
</ref>
<ref id="B26">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gouveia</surname> <given-names>M.</given-names></name> <name><surname>Ribeiro</surname> <given-names>A.</given-names></name> <name><surname>V&#x000E1;rzea</surname> <given-names>V.</given-names></name> <name><surname>Rodrigues</surname> <given-names>C. J.</given-names> <suffix>Jr.</suffix></name></person-group> (<year>2005</year>). <article-title>Genetic diversity in <italic>Hemileia vastatrix</italic> based on RAPD markers</article-title>. <source>Mycologia</source> <volume>97</volume>, <fpage>396</fpage>&#x02013;<lpage>404</lpage>. <pub-id pub-id-type="doi">10.3852/mycologia.97.2.396</pub-id><pub-id pub-id-type="pmid">16396347</pub-id></citation>
</ref>
<ref id="B27">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Grabherr</surname> <given-names>M. G.</given-names></name> <name><surname>Haas</surname> <given-names>B. J.</given-names></name> <name><surname>Yassour</surname> <given-names>M.</given-names></name> <name><surname>Levin</surname> <given-names>J. Z.</given-names></name> <name><surname>Thompson</surname> <given-names>D. A.</given-names></name> <name><surname>Amit</surname> <given-names>I.</given-names></name> <etal/></person-group>. (<year>2011</year>). <article-title>Full-length transcriptome assembly from RNA-Seq data without a reference genome</article-title>. <source>Nat. Biotechnol</source>. <volume>29</volume>, <fpage>644</fpage>&#x02013;<lpage>652</lpage>. <pub-id pub-id-type="doi">10.1038/nbt.1883</pub-id><pub-id pub-id-type="pmid">21572440</pub-id></citation>
</ref>
<ref id="B28">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gu</surname> <given-names>B.</given-names></name> <name><surname>Shiv</surname> <given-names>D.</given-names></name> <name><surname>Kale</surname> <given-names>Q. W.</given-names></name> <name><surname>Dinghe</surname> <given-names>W.</given-names></name> <name><surname>Qiaona</surname> <given-names>P.</given-names></name> <name><surname>Hua</surname> <given-names>C.</given-names></name> <etal/></person-group>. (<year>2011</year>). <article-title>Rust secreted protein Ps87 is conserved in diverse fungal pathogens and contains a RXLR-like motif sufficient for translocation into plant cells</article-title>. <source>PLoS ONE</source> <volume>6</volume>:<fpage>e27217</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0027217</pub-id><pub-id pub-id-type="pmid">22076138</pub-id></citation>
</ref>
<ref id="B30">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hacquard</surname> <given-names>S.</given-names></name> <name><surname>Joly</surname> <given-names>D. L.</given-names></name> <name><surname>Lin</surname> <given-names>Y. G.</given-names></name> <name><surname>Tisserant</surname> <given-names>E.</given-names></name> <name><surname>Feau</surname> <given-names>N.</given-names></name> <name><surname>Delaruelle</surname> <given-names>C.</given-names></name> <etal/></person-group>. (<year>2012</year>). <article-title>A comprehensive analysis of genes encoding small secreted proteins identifies candidate effectors in <italic>Melampsora larici-populina</italic> (Poplar Leaf Rust)</article-title>. <source>Mol. Plant Microbe Interact</source>. <volume>25</volume>, <fpage>279</fpage>&#x02013;<lpage>293</lpage>. <pub-id pub-id-type="doi">10.1094/MPMI-09-11-0238</pub-id><pub-id pub-id-type="pmid">22046958</pub-id></citation>
</ref>
<ref id="B31">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hawkins</surname> <given-names>J.</given-names></name> <name><surname>Boden</surname> <given-names>M.</given-names></name></person-group> (<year>2006</year>). <article-title>Detecting and sorting targeting peptides with recurrent networks and support vector machines</article-title>. <source>J. Bioinform. Comput. Biol</source>. <volume>4</volume>, <fpage>1</fpage>&#x02013;<lpage>18</lpage>. <pub-id pub-id-type="doi">10.1142/S0219720006001771</pub-id><pub-id pub-id-type="pmid">16568539</pub-id></citation>
</ref>
<ref id="B32">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Huang</surname> <given-names>J.</given-names></name> <name><surname>Si</surname> <given-names>W.</given-names></name> <name><surname>Deng</surname> <given-names>Q.</given-names></name> <name><surname>Li</surname> <given-names>P.</given-names></name> <name><surname>Yang</surname> <given-names>S.</given-names></name></person-group> (<year>2014</year>). <article-title>Rapid evolution of avirulence genes in rice blast fungus <italic>Magnaporthe oryzae</italic></article-title>. <source>BMC Genet</source>. <volume>15</volume>:<fpage>45</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2156-15-45</pub-id><pub-id pub-id-type="pmid">24725999</pub-id></citation>
</ref>
<ref id="B33">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Huson</surname> <given-names>D. H.</given-names></name> <name><surname>Mitra</surname> <given-names>S.</given-names></name> <name><surname>Weber</surname> <given-names>N.</given-names></name> <name><surname>Ruscheweyh</surname> <given-names>H.</given-names></name> <name><surname>Schuster</surname> <given-names>S. C.</given-names></name></person-group> (<year>2001</year>). <article-title>Integrative analysis of environmental sequences using MEGAN4</article-title>. <source>Genome Res</source>. <volume>21</volume>, <fpage>1552</fpage>&#x02013;<lpage>1560</lpage>. <pub-id pub-id-type="doi">10.1101/gr.120618.111</pub-id><pub-id pub-id-type="pmid">21690186</pub-id></citation>
</ref>
<ref id="B34">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Joly</surname> <given-names>D. L.</given-names></name> <name><surname>Feau</surname> <given-names>N.</given-names></name> <name><surname>Tanguay</surname> <given-names>P.</given-names></name> <name><surname>Hamelin</surname> <given-names>R. C.</given-names></name></person-group> (<year>2010</year>). <article-title>Comparative analysis of secreted protein evolution using expressed sequence tags from four poplar leaf rusts (<italic>Melampsora</italic> spp.)</article-title>. <source>BMC Genomics</source> <volume>11</volume>:<fpage>422</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2164-11-422</pub-id><pub-id pub-id-type="pmid">20615251</pub-id></citation>
</ref>
<ref id="B35">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kemen</surname> <given-names>E.</given-names></name> <name><surname>Jones</surname> <given-names>J. D.</given-names></name></person-group> (<year>2012</year>). <article-title>Obligate biotroph parasitism: can we link genomes to lifestyles?</article-title> <source>Trends Plant Sci</source>. <volume>17</volume>, <fpage>448</fpage>&#x02013;<lpage>457</lpage>. <pub-id pub-id-type="doi">10.1016/j.tplants.2012.04.005</pub-id><pub-id pub-id-type="pmid">22613788</pub-id></citation>
</ref>
<ref id="B38">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Leguizam&#x000F3;n</surname> <given-names>J. E.</given-names></name> <name><surname>Baeza</surname> <given-names>C. A.</given-names></name> <name><surname>Fern&#x000E1;ndez</surname> <given-names>O.</given-names></name> <name><surname>Moreno</surname> <given-names>G.</given-names></name> <name><surname>Castillo</surname> <given-names>Z. J.</given-names></name> <name><surname>Orozco</surname> <given-names>F. J.</given-names></name></person-group> (<year>1984</year>). <article-title>Identification of race II of <italic>Hemileia vastatrix</italic> Berk y Br. in Colombia</article-title>. <source>Cenicaf&#x000E9;</source> <volume>35</volume>, <fpage>26</fpage>&#x02013;<lpage>28</lpage></citation>
</ref>
<ref id="B40">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>L.</given-names></name> <name><surname>Stoeckert</surname> <given-names>C. J.</given-names> <suffix>Jr.</suffix></name> <name><surname>Roos</surname> <given-names>D. S.</given-names></name></person-group> (<year>2003</year>). <article-title>OrthoMCL: identification of ortholog groups for eukaryotic genomes</article-title>. <source>Genome Res</source>. <volume>13</volume>, <fpage>2178</fpage>&#x02013;<lpage>2189</lpage>. <pub-id pub-id-type="doi">10.1101/gr.1224503</pub-id><pub-id pub-id-type="pmid">12952885</pub-id></citation>
</ref>
<ref id="B42">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mar&#x000E7;ais</surname> <given-names>G.</given-names></name> <name><surname>Kingsford</surname> <given-names>C.</given-names></name></person-group> (<year>2011</year>). <article-title>A fast, lock-free approach for efficient parallel counting of occurrences of <italic>k</italic>-mers</article-title>. <source>Bioinformatics</source> <volume>27</volume>, <fpage>764</fpage>&#x02013;<lpage>770</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btr011</pub-id><pub-id pub-id-type="pmid">21217122</pub-id></citation>
</ref>
<ref id="B43">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Martin</surname> <given-names>F.</given-names></name> <name><surname>Aerts</surname> <given-names>A.</given-names></name> <name><surname>Ahr&#x000E9;n</surname> <given-names>D.</given-names></name> <name><surname>Brun</surname> <given-names>A.</given-names></name> <name><surname>Danchin</surname> <given-names>E. G.</given-names></name> <name><surname>Duchaussoy</surname> <given-names>F.</given-names></name> <etal/></person-group>. (<year>2008</year>). <article-title>The genome of <italic>Laccaria bicolor</italic> provides insights into mycorrhizal symbiosis</article-title>. <source>Nature</source> <volume>452</volume>, <fpage>88</fpage>&#x02013;<lpage>92</lpage>. <pub-id pub-id-type="doi">10.1038/nature06556</pub-id><pub-id pub-id-type="pmid">18322534</pub-id></citation>
</ref>
<ref id="B44">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Martin</surname> <given-names>F.</given-names></name> <name><surname>Kohler</surname> <given-names>A.</given-names></name> <name><surname>Murat</surname> <given-names>C.</given-names></name> <name><surname>Balestrini</surname> <given-names>R.</given-names></name> <name><surname>Coutinho</surname> <given-names>P. M.</given-names></name> <name><surname>Jaillon</surname> <given-names>O.</given-names></name> <etal/></person-group>. (<year>2010</year>). <article-title>P&#x000E9;rigord black truffle genome uncovers evolutionary origins and mechanisms of symbiosis</article-title>. <source>Nature</source> <volume>464</volume>, <fpage>1033</fpage>&#x02013;<lpage>1038</lpage>. <pub-id pub-id-type="doi">10.1038/nature08867</pub-id><pub-id pub-id-type="pmid">20348908</pub-id></citation>
</ref>
<ref id="B45">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Martin</surname> <given-names>J. A.</given-names></name> <name><surname>Wang</surname> <given-names>Z.</given-names></name></person-group> (<year>2011</year>). <article-title>Next-generation transcriptome assembly</article-title>. <source>Nat. Rev. Genet</source>. <volume>12</volume>, <fpage>671</fpage>&#x02013;<lpage>682</lpage>. <pub-id pub-id-type="doi">10.1038/nrg3068</pub-id><pub-id pub-id-type="pmid">21897427</pub-id></citation>
</ref>
<ref id="B46">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Miranda</surname> <given-names>D.</given-names></name> <name><surname>Barton</surname> <given-names>G. J.</given-names></name></person-group> (<year>2007</year>). <article-title>Classification and functional annotation of eukaryotic protein kinases</article-title>. <source>Proteins</source> <volume>68</volume>, <fpage>893</fpage>&#x02013;<lpage>914</lpage>. <pub-id pub-id-type="doi">10.1002/prot.21444</pub-id><pub-id pub-id-type="pmid">17557329</pub-id></citation>
</ref>
<ref id="B47">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Monaco</surname> <given-names>L. C.</given-names></name></person-group> (<year>1977</year>). <article-title>Consequences of the introduction of coffee rust into Brazil</article-title>. <source>Ann. N.Y. Acad. Sci</source>. <volume>287</volume>, <fpage>57</fpage>&#x02013;<lpage>71</lpage>. <pub-id pub-id-type="doi">10.1111/j.1749-6632.1977.tb34231.x</pub-id></citation>
</ref>
<ref id="B48">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nemri</surname> <given-names>A.</given-names></name> <name><surname>Saunders</surname> <given-names>D. G.</given-names></name> <name><surname>Anderson</surname> <given-names>C.</given-names></name> <name><surname>Upadhyaya</surname> <given-names>N. M.</given-names></name> <name><surname>Win</surname> <given-names>J.</given-names></name> <name><surname>Lawrence</surname> <given-names>G. J.</given-names></name> <etal/></person-group>. (<year>2014</year>). <article-title>The genome sequence and effector complement of the flax rust pathogen <italic>Melampsora lini</italic></article-title>. <source>Front. Plant Sci</source>. <volume>5</volume>:<issue>98</issue>. <pub-id pub-id-type="doi">10.3389/fpls.2014.00098</pub-id><pub-id pub-id-type="pmid">24715894</pub-id></citation>
</ref>
<ref id="B49">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Parlange</surname> <given-names>F.</given-names></name> <name><surname>Oberhaensli</surname> <given-names>S.</given-names></name> <name><surname>Breen</surname> <given-names>J.</given-names></name> <name><surname>Platzer</surname> <given-names>M.</given-names></name> <name><surname>Taudien</surname> <given-names>S.</given-names></name> <name><surname>&#x00160;imkov&#x000E1;</surname> <given-names>H.</given-names></name> <etal/></person-group>. (<year>2011</year>). <article-title>A major invasion of transposable elements accounts for the large size of the <italic>Blumeria graminis</italic> f.sp. <italic>tritici</italic> genome</article-title>. <source>Funct. Integr. Genomics</source> <volume>11</volume>, <fpage>671</fpage>&#x02013;<lpage>677</lpage>. <pub-id pub-id-type="doi">10.1007/s10142-011-0240-5</pub-id><pub-id pub-id-type="pmid">21809124</pub-id></citation>
</ref>
<ref id="B50">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Parra</surname> <given-names>G.</given-names></name> <name><surname>Bradnam</surname> <given-names>K.</given-names></name> <name><surname>Korf</surname> <given-names>I.</given-names></name></person-group> (<year>2007</year>). <article-title>CEGMA: a pipeline to accurately annotate core genes in eukaryotic genomes</article-title>. <source>Bioinformatics</source> <volume>23</volume>, <fpage>1061</fpage>&#x02013;<lpage>1067</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btm071</pub-id><pub-id pub-id-type="pmid">17332020</pub-id></citation>
</ref>
<ref id="B51">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Petersen</surname> <given-names>T.</given-names></name> <name><surname>Brunak</surname> <given-names>S.</given-names></name> <name><surname>von Heijne</surname> <given-names>G.</given-names></name> <name><surname>Nielsen</surname> <given-names>H.</given-names></name></person-group> (<year>2011</year>). <article-title>SignalP 4.0: discriminating signal peptides from transmembrane regions</article-title>. <source>Nat. Methods</source> <volume>8</volume>, <fpage>785</fpage>&#x02013;<lpage>786</lpage>. <pub-id pub-id-type="doi">10.1038/nmeth.1701</pub-id><pub-id pub-id-type="pmid">21959131</pub-id></citation>
</ref>
<ref id="B52">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pretsch</surname> <given-names>K.</given-names></name> <name><surname>Kemen</surname> <given-names>A.</given-names></name> <name><surname>Kemen</surname> <given-names>E.</given-names></name> <name><surname>Geiger</surname> <given-names>M.</given-names></name> <name><surname>Mendgen</surname> <given-names>K.</given-names></name> <name><surname>Voegele</surname> <given-names>R.</given-names></name></person-group> (<year>2013</year>). <article-title>The rust transferred proteins-a new family of effector proteins exhibiting protease inhibitor function</article-title>. <source>Mol. Plant Pathol</source>. <volume>14</volume>, <fpage>96</fpage>&#x02013;<lpage>107</lpage>. <pub-id pub-id-type="doi">10.1111/j.1364-3703.2012.00832.x</pub-id><pub-id pub-id-type="pmid">22998218</pub-id></citation>
</ref>
<ref id="B53">
<citation citation-type="web"><person-group person-group-type="author"><collab>Puccinia Group Genomes Database.</collab></person-group> Available online at: <ext-link ext-link-type="uri" xlink:href="http://www.broadinstitute.org/annotation/genome/puccinia_group/GenomeDescriptions.html&#x00023;P_triticina_1_1_V1">http://www.broadinstitute.org/annotation/genome/puccinia_group/GenomeDescriptions.html&#x00023;P_triticina_1_1_V1</ext-link>.</citation>
</ref>
<ref id="B55">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Raffaele</surname> <given-names>S.</given-names></name> <name><surname>Kamoun</surname> <given-names>S.</given-names></name></person-group> (<year>2012</year>). <article-title>Genome evolution in filamentous plant pathogens: why bigger can be better</article-title>. <source>Nat. Rev. Microbiol</source>. <volume>10</volume>, <fpage>417</fpage>&#x02013;<lpage>430</lpage>. <pub-id pub-id-type="doi">10.1038/nrmicro2790</pub-id><pub-id pub-id-type="pmid">22565130</pub-id></citation>
</ref>
<ref id="B56">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Rivillas</surname> <given-names>C.</given-names></name> <name><surname>Serna</surname> <given-names>C.</given-names></name> <name><surname>Cristancho</surname> <given-names>M.</given-names></name> <name><surname>Gait&#x000E1;n</surname> <given-names>A.</given-names></name></person-group> (<year>2011</year>). <source>Roya del Cafeto en Colombia: Impacto, Manejo y Costos del Control</source>. <publisher-loc>Chinchin&#x000E1;</publisher-loc>: <publisher-name>Bolet&#x000ED;n T&#x000E9;cnico No. 36, Cenicafe</publisher-name>.</citation>
</ref>
<ref id="B57">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rodrigues</surname> <given-names>C. J.</given-names> <suffix>Jr.</suffix></name> <name><surname>Bettencourt</surname> <given-names>A. J.</given-names></name> <name><surname>Rijo</surname> <given-names>L.</given-names></name></person-group> (<year>1975</year>). <article-title>Races of the pathogen and resistance to coffee rust</article-title>. <source>Ann. Rev. Phytopathol</source>. <volume>13</volume>, <fpage>49</fpage>&#x02013;<lpage>70</lpage>. <pub-id pub-id-type="doi">10.1146/annurev.py.13.090175.000405</pub-id></citation>
</ref>
<ref id="B58">
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Rodrigues</surname> <given-names>C. J.</given-names> <suffix>Jr.</suffix></name> <name><surname>V&#x000E1;rzea</surname> <given-names>V.</given-names></name> <name><surname>Godinho</surname> <given-names>I. L.</given-names></name> <name><surname>Palma</surname> <given-names>S.</given-names></name> <name><surname>Rato</surname> <given-names>R. C.</given-names></name></person-group> (<year>1993</year>). <article-title>New physiologic races of <italic>Hemileia vastatrix</italic></article-title>, in <source>Proceedings of the 15th International Conference on Coffee Science</source> (<publisher-loc>Montpellier</publisher-loc>), <fpage>318</fpage>&#x02013;<lpage>321</lpage>.</citation>
</ref>
<ref id="B59">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rozo</surname> <given-names>Y.</given-names></name> <name><surname>Escobar</surname> <given-names>C.</given-names></name> <name><surname>Gait&#x000E1;n</surname> <given-names>A. L.</given-names></name> <name><surname>Cristancho</surname> <given-names>M. A.</given-names></name></person-group> (<year>2012</year>). <article-title>Aggressiveness and genetic diversity of <italic>Hemileia vastatrix</italic> during an epidemic in Colombia</article-title>. <source>J. Phytopathol</source>. <volume>160</volume>, <fpage>732</fpage>&#x02013;<lpage>740</lpage>. <pub-id pub-id-type="doi">10.1111/jph.12024</pub-id></citation>
</ref>
<ref id="B60">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Saunders</surname> <given-names>D. G. O.</given-names></name> <name><surname>Win</surname> <given-names>J.</given-names></name> <name><surname>Cano</surname> <given-names>L. M.</given-names></name> <name><surname>Szabo</surname> <given-names>L. J.</given-names></name> <name><surname>Kamoun</surname> <given-names>S.</given-names></name> <name><surname>Rafaelle</surname> <given-names>S.</given-names></name></person-group> (<year>2012</year>). <article-title>Using hierarchical clustering of secreted protein families to classify and rank candidate effectors of rust fungi</article-title>. <source>PLoS ONE</source> <volume>7</volume>:<fpage>e29847</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0029847</pub-id><pub-id pub-id-type="pmid">22238666</pub-id></citation>
</ref>
<ref id="B63">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Schirawski</surname> <given-names>J.</given-names></name> <name><surname>Mannhaupt</surname> <given-names>G.</given-names></name> <name><surname>M&#x000FC;nch</surname> <given-names>K.</given-names></name> <name><surname>Brefort</surname> <given-names>T.</given-names></name> <name><surname>Schipper</surname> <given-names>K.</given-names></name> <name><surname>Doehlemann</surname> <given-names>G.</given-names></name> <etal/></person-group>. (<year>2010</year>). <article-title>Pathogenicity determinants in smut fungi revealed by genome comparison</article-title>. <source>Science</source> <volume>330</volume>, <fpage>1546</fpage>&#x02013;<lpage>1548</lpage>. <pub-id pub-id-type="doi">10.1126/science.1195330</pub-id><pub-id pub-id-type="pmid">21148393</pub-id></citation>
</ref>
<ref id="B65">
<citation citation-type="web"><person-group person-group-type="author"><name><surname>Smit</surname> <given-names>A.</given-names></name> <name><surname>Hubley</surname> <given-names>R.</given-names></name> <name><surname>Green</surname> <given-names>P.</given-names></name></person-group> (<year>1996-2004</year>). <source>RepeatMasker Open-3.0</source>. Available online at: <ext-link ext-link-type="uri" xlink:href="http://www.repeatmasker.org">http://www.repeatmasker.org</ext-link>.</citation>
</ref>
<ref id="B66">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Spanu</surname> <given-names>P. D.</given-names></name></person-group> (<year>2012</year>). <article-title>The genomics of obligate (and nonobligate) biotrophs</article-title>. <source>Annu. Rev. Phytopathol</source>. <volume>50</volume>, <fpage>91</fpage>&#x02013;<lpage>109</lpage>. <pub-id pub-id-type="doi">10.1146/annurev-phyto-081211-173024</pub-id><pub-id pub-id-type="pmid">22559067</pub-id></citation>
</ref>
<ref id="B67">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Spanu</surname> <given-names>P. D.</given-names></name> <name><surname>Abbott</surname> <given-names>J. C.</given-names></name> <name><surname>Amselem</surname> <given-names>J.</given-names></name> <name><surname>Burgis</surname> <given-names>T. A.</given-names></name> <name><surname>Soanes</surname> <given-names>D. M.</given-names></name> <name><surname>St&#x000FC;ber</surname> <given-names>K.</given-names></name> <etal/></person-group>. (<year>2010</year>). <article-title>Genome expansion and gene loss in powdery mildew fungi reveal tradeoffs in extreme parasitism</article-title>. <source>Science</source> <volume>330</volume>, <fpage>1543</fpage>&#x02013;<lpage>1546</lpage>. <pub-id pub-id-type="doi">10.1126/science.1194573</pub-id><pub-id pub-id-type="pmid">21148392</pub-id></citation>
</ref>
<ref id="B68">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Stajich</surname> <given-names>J. E.</given-names></name> <name><surname>Wilke</surname> <given-names>S.</given-names></name> <name><surname>Ahr&#x000E9;n</surname> <given-names>D.</given-names></name> <name><surname>Au</surname> <given-names>C. A.</given-names></name> <name><surname>Birren</surname> <given-names>B. W.</given-names></name> <name><surname>Borodovsky</surname> <given-names>M.</given-names></name> <etal/></person-group>. (<year>2010</year>). <article-title>Insights into evolution of multicellular fungi from the assembled chromosomes of the mushroom <italic>Coprinopsis cinerea</italic> (<italic>Coprinus cinereus</italic>)</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A</source>. <volume>107</volume>, <fpage>11889</fpage>&#x02013;<lpage>11894</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1003391107</pub-id><pub-id pub-id-type="pmid">20547848</pub-id></citation>
</ref>
<ref id="B70">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Stanke</surname> <given-names>M.</given-names></name> <name><surname>Waack</surname> <given-names>S.</given-names></name></person-group> (<year>2003</year>). <article-title>Gene prediction with a hidden Markov model and a new intron submodel</article-title>. <source>Bioinformatics</source> <volume>19</volume>(<supplement>Suppl. 2</supplement>), <fpage>ii215</fpage>&#x02013;<lpage>ii225</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btg1080</pub-id><pub-id pub-id-type="pmid">14534192</pub-id></citation>
</ref>
<ref id="B71">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Stone</surname> <given-names>C. L.</given-names></name> <name><surname>Buitrago</surname> <given-names>M. L.</given-names></name> <name><surname>Boore</surname> <given-names>J. L.</given-names></name> <name><surname>Frederick</surname> <given-names>R. D.</given-names></name></person-group> (<year>2010</year>). <article-title>Analysis of the complete mitochondrial genome sequences of the soybean rust pathogens <italic>Phakopsora pachyrhizi</italic> and <italic>P. meibomiae</italic></article-title>. <source>Mycologia</source> <volume>102</volume>, <fpage>887</fpage>&#x02013;<lpage>897</lpage>. <pub-id pub-id-type="doi">10.3852/09-198</pub-id><pub-id pub-id-type="pmid">20648755</pub-id></citation>
</ref>
<ref id="B72">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sun</surname> <given-names>X.</given-names></name> <name><surname>Le</surname> <given-names>H. D.</given-names></name> <name><surname>Wahlstrom</surname> <given-names>J. M.</given-names></name> <name><surname>Karpen</surname> <given-names>G. H.</given-names></name></person-group> (<year>2003</year>). <article-title>Sequence analysis of a functional Drosophila centromere</article-title>. <source>Genome Res</source>. <volume>13</volume>, <fpage>182</fpage>&#x02013;<lpage>194</lpage>. <pub-id pub-id-type="doi">10.1101/gr.681703</pub-id><pub-id pub-id-type="pmid">12566396</pub-id></citation>
</ref>
<ref id="B73">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Talhinhas</surname> <given-names>P.</given-names></name> <name><surname>Azinheira</surname> <given-names>H.</given-names></name> <name><surname>Vieira</surname> <given-names>B.</given-names></name> <name><surname>Loureiro</surname> <given-names>A.</given-names></name> <name><surname>Tavares</surname> <given-names>S.</given-names></name> <name><surname>Batista</surname> <given-names>D.</given-names></name> <etal/></person-group>. (<year>2014</year>). <article-title>Overview of the functional virulent genome of the coffee leaf rust pathogen <italic>Hemileia vastatrix</italic> with an emphasis on early stages of infection</article-title>. <source>Front. Plant Sci</source>. <volume>5</volume>:<issue>88</issue>. <pub-id pub-id-type="doi">10.3389/fpls.2014.00088</pub-id><pub-id pub-id-type="pmid">24672531</pub-id></citation>
</ref>
<ref id="B74">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tavares</surname> <given-names>S.</given-names></name> <name><surname>Ramos</surname> <given-names>A. P.</given-names></name> <name><surname>Pires</surname> <given-names>A. S.</given-names></name> <name><surname>Azinheira</surname> <given-names>H. G.</given-names></name> <name><surname>Caldeirinha</surname> <given-names>P.</given-names></name> <name><surname>Link</surname> <given-names>T.</given-names></name> <etal/></person-group>. (<year>2014</year>). <article-title>Genome size analyses of Pucciniales reveal the largest fungal genomes</article-title>. <source>Front. Plant Sci</source>. <volume>5</volume>:<issue>422</issue>. <pub-id pub-id-type="doi">10.3389/fpls.2014.00422</pub-id><pub-id pub-id-type="pmid">25206357</pub-id></citation>
</ref>
<ref id="B75">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tisserant</surname> <given-names>E.</given-names></name> <name><surname>Malbreil</surname> <given-names>M.</given-names></name> <name><surname>Kuo</surname> <given-names>A.</given-names></name> <name><surname>Kohler</surname> <given-names>A.</given-names></name> <name><surname>Symeonidi</surname> <given-names>A.</given-names></name> <name><surname>Balestrini</surname> <given-names>R.</given-names></name> <etal/></person-group>. (<year>2013</year>). <article-title>Genome of an arbuscular mycorrhizal fungus provides insight into the oldest plant symbiosis</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A</source>. <volume>110</volume>, <fpage>20117</fpage>&#x02013;<lpage>20122</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1313452110</pub-id><pub-id pub-id-type="pmid">24277808</pub-id></citation>
</ref>
<ref id="B76a">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Toome</surname> <given-names>M.</given-names></name> <name><surname>Ohm</surname> <given-names>R. A.</given-names></name> <name><surname>Riley</surname> <given-names>R. W.</given-names></name> <name><surname>James</surname> <given-names>T. Y.</given-names></name> <name><surname>Lazarus</surname> <given-names>K. L.</given-names></name> <name><surname>Henrissat</surname> <given-names>B.</given-names></name> <etal/></person-group>. (<year>2014</year>). <article-title>Genome sequencing provides insight into the reproductive biology, nutritional mode and ploidy of the fern pathogen <italic>Mixia osmundae</italic></article-title>. <source>New Phytol</source>. <volume>202</volume>, <fpage>554</fpage>&#x02013;<lpage>564</lpage>. <pub-id pub-id-type="doi">10.1111/nph.12653</pub-id><pub-id pub-id-type="pmid">24372469</pub-id></citation>
</ref>
<ref id="B76">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Trapnell</surname> <given-names>C.</given-names></name> <name><surname>Pachter</surname> <given-names>L.</given-names></name> <name><surname>Salzberg</surname> <given-names>S. L.</given-names></name></person-group> (<year>2009</year>). <article-title>TopHat: discovering splice junctions with RNA-Seq</article-title>. <source>Bioinformatics</source> <volume>25</volume>, <fpage>1105</fpage>&#x02013;<lpage>1111</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btp120</pub-id><pub-id pub-id-type="pmid">19289445</pub-id></citation>
</ref>
<ref id="B77">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>X.</given-names></name> <name><surname>McCallum</surname> <given-names>B.</given-names></name></person-group> (<year>2009</year>). <article-title>Fusion body formation, germ tube anastomosis, and nuclear migration during the germination of urediniospores of the wheat leaf rust fungus, <italic>Puccinia triticina</italic></article-title>. <source>Phytopathology</source> <volume>99</volume>, <fpage>1355</fpage>&#x02013;<lpage>1364</lpage>. <pub-id pub-id-type="doi">10.1094/PHYTO-99-12-1355</pub-id><pub-id pub-id-type="pmid">19900001</pub-id></citation>
</ref>
<ref id="B78">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Xu</surname> <given-names>J.</given-names></name> <name><surname>Linning</surname> <given-names>R.</given-names></name> <name><surname>Fellers</surname> <given-names>J.</given-names></name> <name><surname>Dickinson</surname> <given-names>M.</given-names></name> <name><surname>Zhu</surname> <given-names>W.</given-names></name> <name><surname>Antonov</surname> <given-names>I.</given-names></name> <etal/></person-group>. (<year>2011</year>). <article-title>Gene discovery in EST sequences from the wheat leaf rust fungus <italic>Puccinia triticina</italic> sexual spores, asexual spores and haustoria, compared to other rust and corn smut fungi</article-title>. <source>BMC Genomics</source> <volume>12</volume>:<fpage>161</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2164-12-161</pub-id><pub-id pub-id-type="pmid">21435244</pub-id></citation>
</ref>
<ref id="B79">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zheng</surname> <given-names>W.</given-names></name> <name><surname>Huang</surname> <given-names>L.</given-names></name> <name><surname>Huang</surname> <given-names>J.</given-names></name> <name><surname>Wang</surname> <given-names>X.</given-names></name> <name><surname>Chen</surname> <given-names>X.</given-names></name> <name><surname>Zhao</surname> <given-names>J.</given-names></name> <etal/></person-group>. (<year>2013</year>). <article-title>High genome heterozygosity and endemic genetic recombination in the wheat stripe rust fungus</article-title>. <source>Nat. Commun</source>. <volume>4</volume>:<fpage>2673</fpage>. <pub-id pub-id-type="doi">10.1038/ncomms3673</pub-id><pub-id pub-id-type="pmid">24150273</pub-id></citation>
</ref>
<ref id="B80">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhulidov</surname> <given-names>P. A.</given-names></name> <name><surname>Bogdanova</surname> <given-names>E. A.</given-names></name> <name><surname>Shcheglov</surname> <given-names>A. S.</given-names></name> <name><surname>Vagner</surname> <given-names>L. L.</given-names></name> <name><surname>Khaspekov</surname> <given-names>G. L.</given-names></name> <name><surname>Kozhemyako</surname> <given-names>V. B.</given-names></name> <etal/></person-group>. (<year>2004</year>). <article-title>Simple cDNA normalization using kamchatka crab duplex-specific nuclease</article-title>. <source>Nucleic Acids Res</source>. <volume>32</volume>:<fpage>e3</fpage>. <pub-id pub-id-type="doi">10.1093/nar/gnh031</pub-id><pub-id pub-id-type="pmid">14973331</pub-id></citation>
</ref>
</ref-list>
</back>
</article>
