<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Microbiol.</journal-id>
<journal-title>Frontiers in Microbiology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Microbiol.</abbrev-journal-title>
<issn pub-type="epub">1664-302X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fmicb.2018.00344</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Microbiology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Revisiting <italic>Francisella tularensis</italic> subsp. <italic>holarctica</italic>, Causative Agent of Tularemia in Germany With Bioinformatics: New Insights in Genome Structure, DNA Methylation and Comparative Phylogenetic Analysis</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name><surname>Busch</surname> <given-names>Anne</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn001"><sup>&#x002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/502029/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Thomas</surname> <given-names>Prasad</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Zuchantke</surname> <given-names>Eric</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/514481/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Brendebach</surname> <given-names>Holger</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/522603/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Neubert</surname> <given-names>Kerstin</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/8763/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Gruetzke</surname> <given-names>Josephine</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Al Dahouk</surname> <given-names>Sascha</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/402697/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Peters</surname> <given-names>Martin</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Hotzel</surname> <given-names>Helmut</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/390539/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Neubauer</surname> <given-names>Heinrich</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/404391/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Tomaso</surname> <given-names>Herbert</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Institute of Bacterial Infections and Zoonoses, Friedrich-Loeffler-Institut</institution>, <addr-line>Jena</addr-line>, <country>Germany</country></aff>
<aff id="aff2"><sup>2</sup><institution>Department of Biological Safety, German Federal Institute for Risk Assessment</institution>, <addr-line>Berlin</addr-line>, <country>Germany</country></aff>
<aff id="aff3"><sup>3</sup><institution>Algorithmic Bioinformatics, Department of Mathematics and Computer Science, Institute of Computer Science, Freie Universit&#x00E4;t Berlin</institution>, <addr-line>Berlin</addr-line>, <country>Germany</country></aff>
<aff id="aff4"><sup>4</sup><institution>Standort Arnsberg, Chemisches und Veterin&#x00E4;runtersuchungsamt Westfalen</institution>, <addr-line>Arnsberg</addr-line>, <country>Germany</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: <italic>Steve Lindemann, Purdue University, United States</italic></p></fn>
<fn fn-type="edited-by"><p>Reviewed by: <italic>Jason Sahl, Northern Arizona University, United States; Max Maurin, Universit&#x00E9; Grenoble Alpes, France; Jean Challacombe, Los Alamos National Laboratory (DOE), United States</italic></p></fn>
<fn fn-type="corresp" id="fn001"><p>&#x002A;Correspondence: <italic>Anne Busch, <email>anne.busch@fli.de</email></italic></p></fn>
<fn fn-type="other" id="fn002"><p>This article was submitted to Systems Microbiology, a section of the journal Frontiers in Microbiology</p></fn>
</author-notes>
<pub-date pub-type="epub">
<day>13</day>
<month>03</month>
<year>2018</year>
</pub-date>
<pub-date pub-type="collection">
<year>2018</year>
</pub-date>
<volume>9</volume>
<elocation-id>344</elocation-id>
<history>
<date date-type="received">
<day>05</day>
<month>12</month>
<year>2017</year>
</date>
<date date-type="accepted">
<day>12</day>
<month>02</month>
<year>2018</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2018 Busch, Thomas, Zuchantke, Brendebach, Neubert, Gruetzke, Al Dahouk, Peters, Hotzel, Neubauer and Tomaso.</copyright-statement>
<copyright-year>2018</copyright-year>
<copyright-holder>Busch, Thomas, Zuchantke, Brendebach, Neubert, Gruetzke, Al Dahouk, Peters, Hotzel, Neubauer and Tomaso</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<p><italic>Francisella</italic> (<italic>F.</italic>) <italic>tularensis</italic> is a highly virulent, Gram-negative bacterial pathogen and the causative agent of the zoonotic disease tularemia. Here, we generated, analyzed and characterized a high quality circular genome sequence of the <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> strain 12T0050 that caused fatal tularemia in a hare. Besides the genomic structure, we focused on the analysis of oriC, unique to the <italic>Francisella</italic> genus and regulating replication in and outside hosts, and present the first report on genomic DNA methylation of a <italic>Francisella</italic> strain. The high quality genome was used to establish and evaluate a diagnostic whole genome sequencing pipeline. A genotyping strategy for <italic>F. tularensis</italic> was developed using various bioinformatics tools. Additionally, whole genome sequences of <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> isolates collected in the years 2008&#x2013;2015 in Germany were generated. A phylogenetic analysis allowed us to determine the genetic relatedness of these isolates and confirmed the highly conserved nature of <italic>F. tularensis</italic> subsp. <italic>holarctica</italic>.</p>
</abstract>
<kwd-group>
<kwd><italic>Francisella tularensis</italic> subsp. <italic>holarctica</italic></kwd>
<kwd>genome analysis</kwd>
<kwd>tularemia</kwd>
<kwd>high quality genome</kwd>
<kwd>phylogeny</kwd>
</kwd-group>
<counts>
<fig-count count="5"/>
<table-count count="3"/>
<equation-count count="0"/>
<ref-count count="100"/>
<page-count count="15"/>
<word-count count="0"/>
</counts>
</article-meta>
</front>
<body>
<sec><title>Introduction</title>
<p><italic>Francisella (F.) tularensis</italic> is a small, highly infectious, Gram-negative, fastidious bacterial pathogen and the causative agent of tularemia (<xref ref-type="bibr" rid="B32">Ellis et al., 2002</xref>). Tularemia is a zoonosis that can be transmitted to humans through infected blood-feeding arthropods or by ingestion or inhalation of <italic>F. tularensis</italic>. Human infections with <italic>F. tularensis</italic> occur through skin inoculation after handling infected animals and occasionally through laboratory infections. <italic>F. tularensis</italic> is listed as a category A bioterrorism agent, because the infectious dose is very low and the resulting febrile disease may be severe to fatal. It requires prompt antibiotic treatment to avoid severe complications (<xref ref-type="bibr" rid="B72">Rotz et al., 2002</xref>; <xref ref-type="bibr" rid="B52">Maurin, 2015</xref>). The two subspecies <italic>F. tularensis</italic> subsp. <italic>tularensis</italic> and <italic>F.</italic>
<italic>tularensis</italic> subsp. <italic>holarctica</italic> are the major causes of tularemia in humans (<xref ref-type="bibr" rid="B43">Kingry and Petersen, 2014</xref>). Only the less pathogenic <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> is endemic in Europe (<xref ref-type="bibr" rid="B88">T&#x00E4;rnvik and Berglund, 2003</xref>). In Germany and France most human infections are caused by contact with infected European brown hares (<italic>Lepus europaeus</italic>) (<xref ref-type="bibr" rid="B59">M&#x00FC;ller et al., 2013</xref>; <xref ref-type="bibr" rid="B68">Robert-Koch-Institut, 2015</xref>; <xref ref-type="bibr" rid="B56">Moinet et al., 2016</xref>). <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> appears to be a re-emerging pathogen in Germany infecting many animal species and arthropod vectors like ticks (<xref ref-type="bibr" rid="B59">M&#x00FC;ller et al., 2013</xref>; <xref ref-type="bibr" rid="B63">Otto et al., 2015</xref>; <xref ref-type="bibr" rid="B68">Robert-Koch-Institut, 2015</xref>).</p>
<p>Most <italic>Francisella</italic> species share many biological and genomic attributes, but the genetic and functional differences significantly influence virulence and pathogenicity (<xref ref-type="bibr" rid="B40">Jones et al., 2012</xref>, <xref ref-type="bibr" rid="B39">2014</xref>; <xref ref-type="bibr" rid="B92">Ulland et al., 2013</xref>). It is known that <italic>F. tularensis</italic> is a facultative intracellular pathogen infecting a wide variety of cells (<xref ref-type="bibr" rid="B64">Ozanic et al., 2015</xref>). Following uptake into the macrophage, the bacteria at first reside within a phagosome, but then rapidly escape into the cytoplasm. Adaptation to the specialized intracellular lifestyle is associated with evolutionary loss of genes for many metabolic pathways, but <italic>F. tularensis</italic> has retained or evolved mechanisms to efficiently acquire essential nutrients within the host (<xref ref-type="bibr" rid="B9">Barker et al., 2009</xref>; <xref ref-type="bibr" rid="B26">de Bruin et al., 2011</xref>).</p>
<p>All <italic>Francisella</italic> isolates (including <italic>F. tularensis</italic> subsp. <italic>tularensis</italic>, <italic>F. tularensis</italic> subsp. <italic>holarctica</italic>, <italic>F. novicida</italic>) reside in the environment or in a variety of animal hosts. They have small conserved genomes of about 2 Mb. <italic>F. tularensis</italic> strains have a high degree of genetic similarity with an average nucleotide identity of &#x2265;97.7% (<xref ref-type="bibr" rid="B48">Larsson et al., 2009</xref>). Nevertheless, differences are apparent between their respective genomes, genome sizes and protein coding genes. Genome sequencing and analysis has been performed on several <italic>F. tularensis</italic> strains, with a limited number of genomes fully assembled and annotated. Although it is known that <italic>F. tularensis</italic> has methylated DNA (<xref ref-type="bibr" rid="B31">Elkins et al., 1999</xref>), DNA methylation analysis has not yet been performed on other previously sequenced strains. The analysis of DNA methylation can elucidate its role in gene regulation. DNA methylation protects the integrity of prokaryote genomes, but also plays a role in chromosome replication, nucleotide segregation, DNA repair, and transcription (<xref ref-type="bibr" rid="B97">Wion and Casadesus, 2006</xref>; <xref ref-type="bibr" rid="B60">Murray et al., 2012</xref>; <xref ref-type="bibr" rid="B46">Kumar and Rao, 2013</xref>). Bacterial DNA from <italic>F. tularensis</italic> (LVS) containing unmethylated CpG motifs triggers activation of B-cells, but there is no activation when the DNA is methylated (<xref ref-type="bibr" rid="B31">Elkins et al., 1999</xref>). The methylation of <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> hence might play a key role in the pathogenic stealth mechanisms of <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> in macrophages (<xref ref-type="bibr" rid="B21">Champion, 2011</xref>).
Thus, single-molecule real-time (SMRT) sequencing that reveals methylation throughout the genome is a powerful tool for the investigation of this pathogen. We report here the first methylation analysis of a <italic>F. tularensis</italic> genome based on a hybrid assembly using two sequencing technologies (long reads and short reads) and thus high in quality. We assessed the phylogeny of this strain with samples from the same region in North Rhine-Westphalia (Germany) collected in the years 2008&#x2013;2015. An analysis pipeline was established by using this high quality genome to evaluate the best approaches for short read assembly and genome annotation. The microbial phylogeny of <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> could be generated. In the first step the inclusion into the tree of life was targeted. The classification into the phylogenetic tree of life is necessary to allow for an exact classification of new and unknown bacterial species. In a second step the analysis with MLST<sup>+</sup> and Parsnp as reference-independent molecular typing tools enabled a novel detailed view on <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> epidemiology for the <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> 12T0050 in the related regional setting.</p>
</sec>
<sec id="s1" sec-type="materials|methods">
<title>Materials and Methods</title>
<sec><title>Bacterial Strains</title>
<p>The bacterial <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> strain 12T0050 used in the present study as a reference strain was isolated on cysteine heart agar (CHA, Becton Dickinson, BD Heidelberg, Germany) from a carcass of a hare (<italic>Lepus europaeus</italic>) found during an outbreak in 2012 near Herringhausen (North Rhine-Westphalia, Germany). The strain was assigned to clade B.6, subclade B.18 using a set of real-time PCR assays (<xref ref-type="bibr" rid="B68">Robert-Koch-Institut, 2015</xref>; <xref ref-type="bibr" rid="B89">Tomaso et al., 2017</xref>). Subsequent whole genome sequencing and bioinformatics analysis using CanSNPer<sup><xref ref-type="fn" rid="fn01">1</xref></sup>, which is a tool for typing whole genome sequences based on canonical single nucleotide polymorphisms (canSNPs) developed by <xref ref-type="bibr" rid="B47">Larkeryd et al. (2014)</xref>, confirmed clade B.6. The cultivation of bacteria from organ specimens was performed on cysteine heart agar at 37&#x00B0;C with 5% CO<sub>2</sub> for 48 h.</p>
<p>For phylogenetic analysis, bacterial strains were chosen from the collection of strains and sequences maintained at the Friedrich-Loeffler-Institut, Institute of Bacterial Infections and Zoonoses, Jena, Germany. The selection included 14 strains collected in the years 2009&#x2013;2015 in a region close to the outbreak in 2012 in North Rhine-Westphalia (Germany). All strains were identified by MALDI-TOF MS (<xref ref-type="bibr" rid="B80">Seibold et al., 2007</xref>; <xref ref-type="bibr" rid="B59">M&#x00FC;ller et al., 2013</xref>) and PCR assays and assigned to genetic clades and subclades using real-time PCR assays that target canSNPs and INDELs as described (<xref ref-type="bibr" rid="B89">Tomaso et al., 2017</xref>) and shown in <bold>Table <xref ref-type="table" rid="T1">1</xref></bold>. The whole genome sequences were analyzed with the canSNPer tool (<xref ref-type="bibr" rid="B47">Larkeryd et al., 2014</xref>). The reference strain FSC237, <italic>F. tularensis</italic> subsp. <italic>tularensis</italic> SCHU S4 (NC_006570.2), a known human pathogen, was sequenced and assembled to be included as an outlier (<bold>Figure <xref ref-type="fig" rid="F3">3</xref></bold>). <italic>F. tularensis</italic> subsp. <italic>tularensis</italic> was cultivated under BSL-3 conditions; <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> strains were handled under BSL-2 conditions in accordance with German biosafety regulations. The isolates were inactivated at 95&#x00B0;C for 20 min.</p>
<table-wrap position="float" id="T1">
<label>Table 1</label>
<caption><p><italic>Francisella tularensis</italic> subsp. <italic>holarctica</italic> isolates from North Rhine-Westphalia (Germany) with qPCR and canSNPer results, year of collection, and district of isolation. (x; no result obtained).</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<th valign="top" align="left">Sample ID</th>
<th valign="top" align="center">Clade, qPCR</th>
<th valign="top" align="center">Subclade, qPCR</th>
<th valign="top" align="center">canSNPer</th>
<th valign="top" align="center">Collection Date</th>
<th valign="top" align="center">District</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">09T0179</td>
<td valign="top" align="center">B.6</td>
<td valign="top" align="center">B.18</td>
<td valign="top" align="center">B.51</td>
<td valign="top" align="center">2009</td>
<td valign="top" align="center">Geseke</td>
</tr>
<tr>
<td valign="top" align="left">10T0115</td>
<td valign="top" align="center">B.6</td>
<td valign="top" align="center">B.18</td>
<td valign="top" align="center">x</td>
<td valign="top" align="center">2010</td>
<td valign="top" align="center">Waltrop</td>
</tr>
<tr>
<td valign="top" align="left">10T0192</td>
<td valign="top" align="center">B.6</td>
<td valign="top" align="center">B.18</td>
<td valign="top" align="center">B.51</td>
<td valign="top" align="center">2010</td>
<td valign="top" align="center">Geseke</td>
</tr>
<tr>
<td valign="top" align="left">10T0193</td>
<td valign="top" align="center">B.6</td>
<td valign="top" align="center">B.18</td>
<td valign="top" align="center">B.51</td>
<td valign="top" align="center">2010</td>
<td valign="top" align="center">Geseke</td>
</tr>
<tr>
<td valign="top" align="left">11T0309</td>
<td valign="top" align="center">B.6</td>
<td valign="top" align="center">B.18</td>
<td valign="top" align="center">B.49</td>
<td valign="top" align="center">2011</td>
<td valign="top" align="center">Soest</td>
</tr>
<tr>
<td valign="top" align="left">12T0002</td>
<td valign="top" align="center">B.6</td>
<td valign="top" align="center">B.18</td>
<td valign="top" align="center">B.45</td>
<td valign="top" align="center">2012</td>
<td valign="top" align="center">Huels</td>
</tr>
<tr>
<td valign="top" align="left"><bold>12T0050</bold></td>
<td valign="top" align="center"><bold>B.6</bold></td>
<td valign="top" align="center"><bold>B.18</bold></td>
<td valign="top" align="center"><bold>B.X</bold></td>
<td valign="top" align="center"><bold>2012</bold></td>
<td valign="top" align="center"><bold>Herringhausen</bold></td>
</tr>
<tr>
<td valign="top" align="left">12T0062</td>
<td valign="top" align="center">B.6</td>
<td valign="top" align="center">B.18</td>
<td valign="top" align="center">B.62</td>
<td valign="top" align="center">2012</td>
<td valign="top" align="center">Lippstadt</td>
</tr>
<tr>
<td valign="top" align="left">15T0012</td>
<td valign="top" align="center">B.12</td>
<td valign="top" align="center">B.34</td>
<td valign="top" align="center">B.26</td>
<td valign="top" align="center">2015</td>
<td valign="top" align="center">Hoexter</td>
</tr>
<tr>
<td valign="top" align="left">15T0013</td>
<td valign="top" align="center">B.6</td>
<td valign="top" align="center">B.18</td>
<td valign="top" align="center">B.62</td>
<td valign="top" align="center">2015</td>
<td valign="top" align="center">Hoexter</td>
</tr>
<tr>
<td valign="top" align="left">15T0014</td>
<td valign="top" align="center">B.6</td>
<td valign="top" align="center">B.18</td>
<td valign="top" align="center">B.62</td>
<td valign="top" align="center">2015</td>
<td valign="top" align="center">Paderborn</td>
</tr>
<tr>
<td valign="top" align="left">15T0016</td>
<td valign="top" align="center">B.6</td>
<td valign="top" align="center">B.18</td>
<td valign="top" align="center">B.11</td>
<td valign="top" align="center">2015</td>
<td valign="top" align="center">Lippe</td>
</tr>
<tr>
<td valign="top" align="left">15T0031</td>
<td valign="top" align="center">B.12</td>
<td valign="top" align="center">B.34</td>
<td valign="top" align="center">B.26</td>
<td valign="top" align="center">2015</td>
<td valign="top" align="center">Ostwestfalen-Lippe</td>
</tr>
<tr>
<td valign="top" align="left">15T0085</td>
<td valign="top" align="center">B.6</td>
<td valign="top" align="center">B.18</td>
<td valign="top" align="center">B.45</td>
<td valign="top" align="center">2015</td>
<td valign="top" align="center">Euskirchen</td>
</tr>
<tr>
<td valign="top" align="left">15T0086</td>
<td valign="top" align="center">B.6</td>
<td valign="top" align="center">B.18</td>
<td valign="top" align="center">B.49</td>
<td valign="top" align="center">2015</td>
<td valign="top" align="center">Euskirchen</td>
</tr>
<tr>
<td valign="top" align="left"></td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<attrib><italic>Bold lettering highlights the isolate 12T0050.</italic></attrib>
</table-wrap-foot>
</table-wrap>
</sec>
<sec><title>DNA Extraction and Genome Sequencing</title>
<p>DNA for whole genome sequencing was prepared from a 10 mL culture in brain heart infusion broth (Brain, Heart Infusion Broth, Sifin, Berlin, Germany). Bacterial cells were harvested after 72 h by centrifugation, and the DNA was purified using QIAGEN Genomic-tip 20/G and a QIAGEN Genomic DNA buffer set kit (Qiagen, Hilden, Germany). DNA quality was examined by using a Qubit 2.0 fluorometer (Life Technologies, Germany) and by agarose gel electrophoresis.</p>
</sec>
<sec><title>Sequencing, Assembly, Annotation and Genomic Analysis Tools</title>
<p>The isolate 12T0050 was subjected to PacBio sequencing, HiSeq and MiSeq sequencing on Illumina instruments and to Ion Torrent sequencing. Ion Torrent sequencing was performed following the standard procedure with the AB library builder on Ion Torrent S5XL with 520 Chip. The genome sequencing analysis of strain 12T0050 was started with SMRT DNA sequencing (<xref ref-type="bibr" rid="B53">McCarthy, 2010</xref>) using a PacBio RSII sequencer at GATC Biotech (Germany). Genome assembly was carried out using the HGAP algorithm version 3 (RS_HGAP_Assembly.3) (<xref ref-type="bibr" rid="B25">Chin et al., 2013</xref>) implemented in PacBio SMRT portal version 2.3.0. The two SMRT<sup>&#x00AE;</sup> Cells were pooled together and assembled. Circularization of the genome sequence, represented by a single contig, and merging of the contig was carried out using Circlator (<xref ref-type="bibr" rid="B37">Hunt et al., 2015</xref>). The circular contig was polished with the RS_Resequencing.1 protocol available on the SMRT portal v2.3.0. Methylome analysis was done with RS_Modification_detection.1 and Modification_and_Motif_Analysis.1, both of which are also available in the SMRT portal v2.3.0. After circularization, the sequence was corrected with Illumina MiSeq data for the substitutions due to sequencing errors and for frameshifts to generate &#x201C;hybrid assemblies&#x201D; (software used from Boyke Bund, personal communication, available on request) and named 12T0050_FLI.</p>
<p>This optimized sequence of <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> isolate 12T0050_FLI was used to compare the results of various assembly and annotation software solutions. For quality control and trimming of the sequencing reads the programs bbmap/bbduk suite (<xref ref-type="bibr" rid="B17">Bushnell, 2017</xref>) and sickle (<xref ref-type="bibr" rid="B76">Schirmer et al., 2015</xref>) were used. The following open source assembler programs were tested: SPAdes v. 3.9.1 (<xref ref-type="bibr" rid="B7">Bankevich et al., 2012</xref>) (with and without error correction in Bayes Hammer modes supported by GNU-parallelization (<xref ref-type="bibr" rid="B87">Tange, 2011</xref>)), MaSuRCA 3.1.0 (<xref ref-type="bibr" rid="B100">Zimin et al., 2013</xref>), and ABySS 2.0.2 (<xref ref-type="bibr" rid="B81">Simpson et al., 2009</xref>). Additionally, the assembler of CLC (CLC Genomics Workbench 9.5.3)<sup><xref ref-type="fn" rid="fn02">2</xref></sup> was included, a commercially available software package with quality check and automated preprocessing. Analysis of the generated assembly was performed with QUAST 4.3 (<xref ref-type="bibr" rid="B35">Gurevich et al., 2013</xref>) with gene prediction using GeneMarkS Suite and Bandage 0.8.1 (<xref ref-type="bibr" rid="B96">Wick et al., 2015</xref>). All three short read sequencing technologies performed equally well, though longer read length in MiSeq data led to a reduction of contig numbers.
The assembled contigs were tested with different annotation or gene identification algorithms and compared: Prokka annotation pipeline 1.12-beta in standard settings (<xref ref-type="bibr" rid="B78">Seemann, 2014</xref>), Rapid Annotation using Subsystem Technology (RAST) server and Glimmer 3, Glimmer HMM-3.0.3 (<xref ref-type="bibr" rid="B28">Delcher et al., 1999</xref>, <xref ref-type="bibr" rid="B27">2007</xref>; <xref ref-type="bibr" rid="B6">Aziz et al., 2008</xref>) and AUGUSTUS, an annotation tool, optimized for eukaryotes but also known to produce good annotations with prokaryotes (<xref ref-type="bibr" rid="B28">Delcher et al., 1999</xref>, <xref ref-type="bibr" rid="B27">2007</xref>; <xref ref-type="bibr" rid="B84">Stanke et al., 2006</xref>; <xref ref-type="bibr" rid="B6">Aziz et al., 2008</xref>; <xref ref-type="bibr" rid="B54">Meyer et al., 2008</xref>). Samples were tested for contaminations with Kraken version 0.10.6-unreleased (<xref ref-type="bibr" rid="B98">Wood and Salzberg, 2014</xref>) and manually curated to exclude samples with high contamination rates. We established a uniform protocol for all data, consisting of SPAdes assembly in the Bayes-Hammer mode, the filtering of contigs (removing contigs smaller than 500 bp and with less than 3 reads coverage) and Kraken testing.</p>
<p>For genomic analysis the origin of replication (oriC) was identified using ori-Finder (<xref ref-type="bibr" rid="B33">Gao and Zhang, 2008</xref>). CRISPR loci were searched using the CRISPR Recognition Tool version 1.1 (<xref ref-type="bibr" rid="B13">Bland et al., 2007</xref>). Prophage elements were searched by using PHAST (<xref ref-type="bibr" rid="B99">Zhou et al., 2011</xref>). Tandem repeats were searched for with a tandem repeat finder version 4.09 (<xref ref-type="bibr" rid="B12">Benson, 1999</xref>). Average nucleotide identity (ANI) was calculated with enveomics (<xref ref-type="bibr" rid="B70">Rodriguez-R and Konstantinidis, 2016</xref>). CpG islands were detected by EMBOSS in standard settings (<xref ref-type="bibr" rid="B67">Rice et al., 2000</xref>). Visualization was carried out using smrtview (<xref ref-type="bibr" rid="B25">Chin et al., 2013</xref>), Artemis (<xref ref-type="bibr" rid="B19">Carver et al., 2012</xref>), and DNAplotter (<xref ref-type="bibr" rid="B20">Carver et al., 2009</xref>). Methylation motif analysis was performed with Rebase (<xref ref-type="bibr" rid="B69">Roberts et al., 2015</xref>).</p>
<p>All other strains were subjected only to Illumina HiSeq and/or MiSeq sequencing using the Nextera XT DNA protocol for library preparation (GATC, Konstanz, Germany and BfR, Berlin, Germany). The number of reads after filtering ranged from 0.5 million to 5 million resulting in an average nucleotide coverage of >50 (see <bold>Supplementary Figure <xref ref-type="supplementary-material" rid="SM1">S1</xref></bold>).</p>
</sec>
<sec><title>Phylogenetic Analyses</title>
<p>To assess the phylogenetic classification of assorted <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> genomes, already published methods based on different bioinformatics approaches using whole genome sequence data were compared. All selected strains were characterized using a combination of independent methods including MALDI-TOF MS, conventional PCR and real-time PCR assays targeting INDEL loci and canSNPs as previously described (<xref ref-type="bibr" rid="B90">Tomaso et al., 2007</xref>; <xref ref-type="bibr" rid="B47">Larkeryd et al., 2014</xref>). The phylogenetic study included various species and subspecies within the genus, such as <italic>F. tularensis</italic> subsp. <italic>tularensis, F. tularensis</italic> subsp. <italic>novicida, F. philomiragia</italic>, and <italic>F. noatunensis, F. guangzhouensis</italic> (NC_006570.2, NZ_JOOT00000000.1, NZ_CP010427, NC_010336.1, NZ_LTDO00000000.1) retrieved from the NCBI database, as well as strains that are well characterized representatives of different clades of <italic>F. tularensis</italic> subsp. <italic>holarctica</italic>, i.e., clade B.4 (NC_017463), B.6 (NC_009749) and B.12 (NC_019551). As an outgroup an <italic>Escherichia coli</italic> (NC_002695) and a <italic>Salmonella enterica</italic> genome (NC_003198) were included. All genomes were assessed as assemblies and newly annotated with Prokka to allow for greater comparability.</p>
<p>Taxonomic classification was performed with 16S rRNA gene analysis using MOLE-BLAST (<xref ref-type="bibr" rid="B1">Altschul et al., 1997</xref>; <xref ref-type="bibr" rid="B30">Edgar, 2004</xref>) with standard settings excluding uncultured samples. The coding sequences for 16S rRNA were extracted with Geneious (<xref ref-type="bibr" rid="B42">Kearse et al., 2012</xref>). This was compared to PhyloPhlAn to include the samples into the tree of life. PhyloPhlAn was used with the annotation files resulting from Prokka and performed with standard setting on all samples. These two methods generated distance matrices on fixed inputs and allowed database independent and sample size independent inclusion in the tree of life. These two methods were compared to SeqSphere and Parsnp. SeqSphere, a commercially available multilocus sequence typing tool based on the core genome analysis, was used as described (<xref ref-type="bibr" rid="B3">Antwerpen et al., 2015</xref>) and compared to the open source software Parsnp v1.2, a command-line-tool for efficient microbial core genome alignment. This program uses SNP detection as part of the Harvest suite in standard setting (<xref ref-type="bibr" rid="B91">Treangen et al., 2014</xref>). The core genome of the genome sequences is used to create a multiple meta-alignment file. A maximum likelihood tree was generated with Randomized Accelerated Maximum Likelihood, RAxML (<xref ref-type="bibr" rid="B83">Stamatakis, 2014</xref>) in GTRGAMMA model and a bootstrap number of 500. Figures were generated using Dendroscope (<xref ref-type="bibr" rid="B38">Huson et al., 2007</xref>). Here we used TempEst for the visualization and analysis of temporally sampled sequence data (<xref ref-type="bibr" rid="B66">Rambaut et al., 2016</xref>).</p>
</sec>
</sec>
<sec><title>Results</title>
<sec><title>Genome Compilation</title>
<p>To establish a complete reference genome, <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> isolate 12T0050 was sequenced by applying SMRT<sup>&#x00AE;</sup> Technology. The sequencing approach with 2 flow cells yielded 20 116 reads with a total of 253 596 265 bases, 24 647 reads, an average length of 11477 bases. The total runtime including data transfer and analysis was 172 min. Resequencing resulted in an average reference bases called of 100 and 99.9% concordance and average reference coverage of 114.3. The Hierarchical Genome Assembly Process (HGAP) resulted in a single contig of 1890609 bp. The GC-content was 32.2%. The chromosome assembly was generated in Circlator and was visualized with the Artemis Comparison Tool (<bold>Figure <xref ref-type="fig" rid="F1">1</xref></bold>). A high quality genome sequence was generated using a hybrid approach involving both long and short reads, whereby the long reads were used for the initial assembly, which was subsequently corrected using short reads to remove insertions/deletions that occur with assembly approaches based on long reads alone. The corrections were made accordingly as the MiSeq data were mapped with bwa v.0.7.12-r1039, variants were called with varscan v2.3 and the consensus was generated with GATK v.3.7.0-gcfedb67 (<xref ref-type="bibr" rid="B44">Koboldt et al., 2009</xref>; <xref ref-type="bibr" rid="B50">Li and Durbin, 2010</xref>; <xref ref-type="bibr" rid="B93">Van der Auwera et al., 2013</xref>). It is denoted 12T0050_FLI. It is submitted as <italic>Francisella tularensis</italic> subsp. <italic>holarctica</italic> 12T0050_FLI under the BioProject <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="PRJNA422969">PRJNA422969</ext-link>, BioSample <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="SAMN08201031">SAMN08201031</ext-link>, Accession number <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="CP025778">CP025778</ext-link>.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption><p>Plot of the complete <italic>Francisella tularensis</italic> subsp. <italic>holarctica</italic> 12T0050. The genome consists of 1890738 base pairs and 2114 predicted coding sequences. The circles represent from the inside: 1, GC skew (red above and black below zero, 10 kb window); 2, GC content (blue above and black below genome average of 32.20%, 10 kb window); 3, strand-specific genome-wide methylation analyzed in 10 kb windows; 4, strand-specific methylation per gene; 5, scale in million base pairs (Mb). Methylation color spectrum goes from blue (minimum, 5%) over yellow (mean, 12.5%) to red (maximum, 23%).</p></caption>
<graphic xlink:href="fmicb-09-00344-g001.tif"/>
</fig>
</sec>
<sec><title>Genome Assembly</title>
<p>With 12T0050_FLI we assessed the best short-read assembly strategy to set out (see <bold>Supplementary Table <xref ref-type="supplementary-material" rid="SM2">S1</xref></bold>). All assemblers were evaluated for contig size, gene content and overall quality. First, the preprocessing was evaluated aiming for quality score based read filtering, base trimming, and removal of contaminations caused by phiX and adapter sequences. Preprocessing (bbduk and sickle) did not result in a significant improvement of the assembly quality with respect to gene content or contig size. The SPAdes assembler in BayesHammer mode without preprocessing resulted in a comparable quality to other preprocessing methods. In the assembler comparison, MaSuRCA and ABySS over- and underestimated gene content and genome sizes by up to 36%. Robust results were obtained with all sequencer platforms with the SPAdes assembler in BayesHammer mode, which was therefore regarded as the method of choice. An additional quality improvement was generated by excluding contigs that were smaller than 500 bp or had a coverage lower than 3 (using fastgrep.pl)<sup><xref ref-type="fn" rid="fn03">3</xref></sup>. CLC provided preprocessing and assemblies with comparably good results, but could not easily be included into a workflow with open source programs and was thus excluded.</p>
</sec>
<sec><title>Genome Annotation</title>
<p>Genome annotation on the reference genome of 12T0050_FLI with Prokka resulted in 2114 CDS (coding DNA sequences, which code for proteins), while RAST and AUGUSTUS resulted in 2141, and GlimmerES in 6398 possible open reading frames rather than CDS, as shown in <bold>Table <xref ref-type="table" rid="T2">2</xref></bold>.</p>
<table-wrap position="float" id="T2">
<label>Table 2</label>
<caption><p>Annotated features of the genome of <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> strain 12T0050_FLI, generated with Glimmer, Prokka, RAST and Augustus.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<th valign="top" align="left">Feature</th>
<th valign="top" align="center">Glimmer</th>
<th valign="top" align="center">Prokka</th>
<th valign="top" align="center">RAST</th>
<th valign="top" align="center">Augustus</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left"><bold>CDS<sup>&#x2217;</sup></bold></td>
<td valign="top" align="center">6398<sup>&#x2217;</sup></td>
<td valign="top" align="center"><bold>2114</bold></td>
<td valign="top" align="center">2141</td>
<td valign="top" align="center">2141</td>
</tr>
<tr>
<td valign="top" align="left"><bold>rRNA</bold></td>
<td valign="top" align="center">30</td>
<td valign="top" align="center"><bold>10</bold></td>
<td valign="top" align="center">48</td>
<td valign="top" align="center">20</td>
</tr>
<tr>
<td valign="top" align="left"><bold>tRNA</bold></td>
<td valign="top" align="center">114</td>
<td valign="top" align="center"><bold>38</bold></td>
<td valign="top" align="center">48</td>
<td valign="top" align="center">76</td>
</tr>
<tr>
<td valign="top" align="left"><bold>Size</bold></td>
<td valign="top" align="center">1890815</td>
<td valign="top" align="center"><bold>1890815</bold></td>
<td valign="top" align="center">1890815</td>
<td valign="top" align="center">1890815</td>
</tr>
<tr>
<td valign="top" align="left"><bold>GC Content</bold></td>
<td valign="top" align="center">32.2%</td>
<td valign="top" align="center"><bold>32.2%</bold></td>
<td valign="top" align="center">32.2%</td>
<td valign="top" align="center">32.2%</td>
</tr>
<tr>
<td valign="top" align="left"></td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<attrib><italic><sup>&#x2217;</sup>Glimmer predicting only possible protein coding regions not annotating afterwards. In bold lettering the recommended software.</italic></attrib>
</table-wrap-foot>
</table-wrap>
</sec>
<sec><title>Genome Analysis: CRISPR, Prophages, cpG Islands and Origin of Replication</title>
<p>In 12T0050_FLI no CRISPR loci were identified with the CRISPR Recognition Tool version 1.1. The gene FTN_0757 of <italic>F. novicida</italic> showed significant sequence similarity to the CRISPR-CAS system protein Cas9 and one homologue was also found in 12T0050_FLI (1 258 283-1 260 798). In these 2515 nucleotides, 586 methylation sites are reported. Additionally, 5 of the directly adjacent 5&#x2032; positions of this region are methylated. No prophage elements were identified using PHAST. Eighty-seven tandem repeats were identified with the Tandem Repeats Finder. Eight unusual cpG islands were predicted using EMBOSS and analyzed for methylation (<xref ref-type="bibr" rid="B67">Rice et al., 2000</xref>) (<bold>Supplementary Table <xref ref-type="supplementary-material" rid="SM3">S2</xref></bold>).</p>
<p>The origin of replication was predicted in a region with 1071 bp located 100 bp proximal in 5&#x2032;-direction of 4 DnaA box sequences (similar to ttatccaca) with not more than one mismatch to the <italic>Escherichia coli</italic> DnaA box. The origin of replication in <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> 12T0050_FLI was set accordingly. Two DnaA boxes had the identical sequence tgtggataa and can be presented as a new DnaA box identifier in <italic>F. tularensis</italic> subsp. <italic>holarctica</italic>. It seems to be characteristic for all <italic>Francisella</italic> species according to BLASTn. All features were included in <bold>Figure <xref ref-type="fig" rid="F1">1</xref></bold>.</p>
</sec>
<sec><title>Base Modification Detection and Methylation Analysis</title>
<p>Methylation is pervasive in <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> isolate 12T0050_FLI. More than 150,000 methylation sites were detected of which 12&#x2013;40% were methylated. Most sites belong to the Type I restriction modification system, which recognizes bipartite motifs and cleaves at large distances from its binding sites, or to orphan methylases. Incomplete methylation is typical for most orphan methylases that are suspected to play a major role in regulation of prokaryotic gene expression. Here, the single molecule, real-time sequencing reads were used to map DNA modifications including N6-methyl-adenosine (m6A), N4-methyl-cytosine (m4C) and 5-methyl-cytosine (m5C), see <bold>Table <xref ref-type="table" rid="T3">3</xref></bold>.</p>
<table-wrap position="float" id="T3">
<label>Table 3</label>
<caption><p>Methylated motifs detected in <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> strain 12T0050_FLI.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<th valign="top" align="left">Motif</th>
<th valign="top" align="center">Modified position</th>
<th valign="top" align="left">Type</th>
<th valign="top" align="center">% of motif detected</th>
<th valign="top" align="center">Number of motifs detected</th>
<th valign="top" align="center">Number of motifs in genome</th>
<th valign="top" align="center">Mean modification QV</th>
<th valign="top" align="center">Mean motif coverage</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">GGTYDKTGV</td>
<td valign="top" align="center">1</td>
<td valign="top" align="left">Unknown</td>
<td valign="top" align="center">38.8%</td>
<td valign="top" align="center">123</td>
<td valign="top" align="center">317</td>
<td valign="top" align="center">41.68</td>
<td valign="top" align="center">58.33</td>
</tr>
<tr>
<td valign="top" align="left">ADGTACTA</td>
<td valign="top" align="center">1</td>
<td valign="top" align="left">m6A</td>
<td valign="top" align="center">37.01%</td>
<td valign="top" align="center">104</td>
<td valign="top" align="center">281</td>
<td valign="top" align="center">44.12</td>
<td valign="top" align="center">54.46</td>
</tr>
<tr>
<td valign="top" align="left">GNNNNVNH</td>
<td valign="top" align="center">1</td>
<td valign="top" align="left">Unknown</td>
<td valign="top" align="center">29.61%</td>
<td valign="top" align="center">97737</td>
<td valign="top" align="center">330035</td>
<td valign="top" align="center">42.05</td>
<td valign="top" align="center">54.80</td>
</tr>
<tr>
<td valign="top" align="left">GBTBNRVGV</td>
<td valign="top" align="center">1</td>
<td valign="top" align="left">Unknown</td>
<td valign="top" align="center">21.12%</td>
<td valign="top" align="center">814</td>
<td valign="top" align="center">3855</td>
<td valign="top" align="center">39.24</td>
<td valign="top" align="center">56.61</td>
</tr>
<tr>
<td valign="top" align="left">GSVVNNNG</td>
<td valign="top" align="center">1</td>
<td valign="top" align="left">Unknown</td>
<td valign="top" align="center">20.28%</td>
<td valign="top" align="center">2841</td>
<td valign="top" align="center">14011</td>
<td valign="top" align="center">39.48</td>
<td valign="top" align="center">55.97</td>
</tr>
<tr>
<td valign="top" align="left">GNNNNTBH</td>
<td valign="top" align="center">1</td>
<td valign="top" align="left">Unknown</td>
<td valign="top" align="center">16.28%</td>
<td valign="top" align="center">20400</td>
<td valign="top" align="center">125341</td>
<td valign="top" align="center">39.88</td>
<td valign="top" align="center">55.61</td>
</tr>
<tr>
<td valign="top" align="left">TNNBASYW</td>
<td valign="top" align="center">1</td>
<td valign="top" align="left">Unknown</td>
<td valign="top" align="center">14.85%</td>
<td valign="top" align="center">5951</td>
<td valign="top" align="center">40077</td>
<td valign="top" align="center">41.31</td>
<td valign="top" align="center">55.58</td>
</tr>
<tr>
<td valign="top" align="left">VANDYAGYA</td>
<td valign="top" align="center">2</td>
<td valign="top" align="left">m6A</td>
<td valign="top" align="center">13.89%</td>
<td valign="top" align="center">527</td>
<td valign="top" align="center">3793</td>
<td valign="top" align="center">42.41</td>
<td valign="top" align="center">54.84</td>
</tr>
<tr>
<td valign="top" align="left">CNNNNRNW</td>
<td valign="top" align="center">1</td>
<td valign="top" align="left">Unknown</td>
<td valign="top" align="center">10.95%</td>
<td valign="top" align="center">24699</td>
<td valign="top" align="center">225647</td>
<td valign="top" align="center">40.82</td>
<td valign="top" align="center">56.15</td>
</tr>
<tr>
<td valign="top" align="left"></td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<attrib><italic>A mean modification Quality Value (QV) refers to the level of confidence that a base is methylated. A QV of 30 or higher is considered significant. The mean coverage for all instances where this motif was detected as modified.</italic></attrib>
</table-wrap-foot>
</table-wrap>
</sec>
<sec><title>Comparative Genome Analysis and Visualization</title>
<p>The assembly of 12T0050_FLI represents the first high quality full genome sequence of an isolate with German origin. It shares the common Clade B.6 with the Swedish <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> strain FTNF-002-00, NC_009749. The finishing of the genome of 12T0050_FLI enabled a detailed comparison of genome architecture and gene content. The sequence reads of 12T0050 were mapped to NC_009749 (<xref ref-type="bibr" rid="B42">Kearse et al., 2012</xref>). The main part of variable SNPs between NC_009749 and 12T0050_FLI were in non-coding repeat regions. Only two insertions were in coding regions and resulted in reading frame changes: one 73 bp insertion in an aspartate alanine antiporter CDS (CYL81_01665) and one 16 bp insertion in an IS630 family transposase CDS (CYL81_02715).</p>
</sec>
<sec><title>Phylogenetic Analysis</title>
<p>In the first step the inclusion into the tree of life was targeted. The classification into the phylogenetic tree of life is necessary to allow for an exact classification of new and unknown bacterial species. The phylogenetic analysis was performed in two steps. First, the taxonomic classification was performed by 16S rRNA analysis with MOLE-BLAST, as the most traditional tool of classification (<bold>Figure <xref ref-type="fig" rid="F2">2</xref></bold>). PhyloPhlAn includes a non-redundant database of 400 proteins generated from 3,737 genomes of all microbial taxa to assign microbial phylogeny and putative taxonomy. The software builds phylogenetic trees based on >4,600 aligned amino acid positions, mirroring thus more the changes in the protein sequence and thus functionality than on nucleotide acid changes that might be silent. PhyloPhlAn was able to measure the sequence diversity of all <italic>Francisella</italic> strains allowing even the resolution of the different clades (<bold>Figure <xref ref-type="fig" rid="F3">3</xref></bold>). In a second step for closer epidemiological investigations MLST<sup>+</sup> and Parsnp analysis were compared (<bold>Figure <xref ref-type="fig" rid="F5">5</xref></bold>). MLST<sup>+</sup> was performed with SeqSphere, a multilocus sequence typing tool based on the core genome that was used as described (<xref ref-type="bibr" rid="B3">Antwerpen et al., 2015</xref>). Before the usage of Parsnp, a control of the ANI &#x2265; 97 % is recommended. In the sample group the ANI was between 99.90% (12T0050_FLI/NC_017463) and 99.99% (12T0050_FLI/NC_009749). A deeper analysis was possible with the open source program Parsnp for core genome alignment and SNP detection as part of the Harvest suite in standard settings (<xref ref-type="bibr" rid="B91">Treangen et al., 2014</xref>). Common genes distributed across the chromosomes of all genomes analyzed represent the chromosomal core. 
The MUM segments, representing the core genome to derive SNPs, spanned 1.3 Mb. A maximum likelihood tree with the GTRGAMMA model of rate heterogeneity was calculated with RAxML (<xref ref-type="bibr" rid="B83">Stamatakis, 2014</xref>) and supported by a bootstrapping test with 500 resamples. Phylogenomic analyses performed in a maximum likelihood (ML) framework using variable coding positions unambiguously identified 137 positions in all genomes for chromosomal sequences. Despite the reduced size of these data sets, unique SNPs were observed for all strains.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption><p>Phylogeny based on 16S rRNA performed with MOLE-BLAST.</p></caption>
<graphic xlink:href="fmicb-09-00344-g002.tif"/>
</fig>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption><p>PhyloPhlAn analysis of all <italic>Francisella</italic> isolates using amino acid sequences of more than 400 proteins. The graphic scale equals 2.0 amino acid differences in the overview <bold>(A)</bold> and in the detailed view with <italic>F. tularensis</italic> subsp. <italic>holarctica</italic>, the graphic scale equals 0.001 amino acid difference <bold>(B)</bold>.</p></caption>
<graphic xlink:href="fmicb-09-00344-g003.tif"/>
</fig>
<p>Maximum likelihood trees derived from the analysis of chromosomal sequences strongly supported the existence of the three clades B.4, B.6 and B.12. However, the number of SNPs will probably increase with larger numbers of available isolates and sequences of whole genomes. 12T0050 was separated from the reference strains by 17 SNPs (B.6 strain), 629 SNPs (B.12 strain) and 648 SNPs (B.4 strain). An <italic>R</italic><sup>2</sup> value of 1.89 &#x00D7; 10<sup>&#x2212;2</sup>, less than 0.5, suggested weak clock-like behavior. The regression slope (rate) included negative values.</p>
</sec>
</sec>
<sec><title>Discussion</title>
<p>The sequenced genome 12T0050_FLI enabled a detailed analysis of genome architecture and gene content with bioinformatics tools. Pacific Biosciences DNA sequencing platforms generate long reads that can produce complete genome assemblies, but the sequencing is expensive and error-prone. The Illumina DNA sequencing platform generates accurate but short reads. There is significant interest in combining data from these complementary sequencing technologies to generate more accurate &#x201C;hybrid&#x201D; assemblies. Thus, we produced here a hybrid assembly of those two sequencing technologies for an optimal genome with the name 12T0050_FLI. The analysis resulted in a single contig of 1890609 bp and with that a slightly smaller genome than published genome sequences NC_017463 (1895727 bp) or NC_009749 (1890909 bp). The genomic analysis included the comparison to the closest neighbor NC_009749, the identification of the origin of replication, CRISPR regions, prophage regions and the analysis of the methylome. With a two-step phylogenetic analysis we established a new whole genome analysis pipeline that allowed description of a phylogenetic analysis of isolates collected in a circumscribed area in Germany and to elucidate the epidemiological context.</p>
<p>Several genome sequences of <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> are published but only a limited number of genomes has been fully assembled and annotated (<xref ref-type="bibr" rid="B49">Larsson et al., 2005</xref>, <xref ref-type="bibr" rid="B48">2009</xref>; <xref ref-type="bibr" rid="B11">Beckstrom-Sternberg et al., 2007</xref>; <xref ref-type="bibr" rid="B24">Chaudhuri et al., 2007</xref>; <xref ref-type="bibr" rid="B71">Rohmer et al., 2007</xref>; <xref ref-type="bibr" rid="B8">Barabote et al., 2009</xref>; <xref ref-type="bibr" rid="B21">Champion, 2011</xref>; <xref ref-type="bibr" rid="B55">Modise et al., 2012</xref>; <xref ref-type="bibr" rid="B82">Sjodin et al., 2012</xref>; <xref ref-type="bibr" rid="B86">Svensson et al., 2012</xref>; <xref ref-type="bibr" rid="B4">Antwerpen et al., 2013</xref>, <xref ref-type="bibr" rid="B3">2015</xref>; <xref ref-type="bibr" rid="B5">Atkins et al., 2015</xref>; <xref ref-type="bibr" rid="B16">Busch et al., 2017</xref>). The here described assembly is a high quality full genome sequence. It is closely related to the Swedish <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> strain FTNF-002-00, NC_009749 Clade B.6. The genomic sequence 12T0050_FLI was mapped to NC_009749 (<xref ref-type="bibr" rid="B42">Kearse et al., 2012</xref>) and 77 SNPs could be called. Most divergent SNPs between NC_009749 and 12T0050_FLI were in non-coding repetitive regions and might be sequencing or assembly errors. Two insertions were in coding regions and resulted in reading frame changes: 73 bp in an aspartate alanine antiporter CDS and a 16 bp insertion in an ISO 630 family transposase CDS both of hitherto unknown effect on the phenotype.</p>
<p>CRISPR elements in bacteria confer protection against bacteriophages; approximately 40% of the bacterial genomes are known to carry CRISPR elements (<xref ref-type="bibr" rid="B10">Barrangou et al., 2007</xref>). In 12T0050_FLI no CRISPR loci were detected <italic>in silico</italic>. A CRISPR/Cas9 system has been reported for <italic>F. novicida</italic> (<xref ref-type="bibr" rid="B75">Sampson et al., 2013</xref>) and also from other <italic>Francisella</italic> strains, but these systems seem to be non-functional (<xref ref-type="bibr" rid="B77">Schunder et al., 2013</xref>). In particular, the gene FTN_0757 was found to have sequence similarity to the CRISPR-CAS system protein Cas9 (<xref ref-type="bibr" rid="B75">Sampson et al., 2013</xref>). One homologue has also been found in 12T0050_FLI and is extensively methylated (23 %) (CYL81_06580). This coincidence might have major impact on endogenous gene regulation, ultimately promoting both pathogenesis and commensalism.</p>
<p>Phage therapy is a potential alternative to the use of antibiotics in the up-coming era of drug-resistant pathogens. Especially because of the highly infectious nature of <italic>F. tularensis</italic>, phages might be one of the potential replacement options for antibiotics. Occasionally, phages are also involved in the lateral transfer of mobile DNA elements or bacterial DNA (<xref ref-type="bibr" rid="B18">Canchaya et al., 2003</xref>; <xref ref-type="bibr" rid="B34">Golkar et al., 2014</xref>). That would be of utmost importance because of the few differences that distinguish the highly virulent form of <italic>F. tularensis</italic> subsp. <italic>tularensis</italic> from <italic>F. tularensis</italic> subsp. <italic>holarctica</italic>. However, no prophage elements were identified using PHAST, indicating that <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> does not host viral infections. That minimizes the alternatives for antibiotics in form of phage therapy, but also the risks of lateral gene transfer. Fortunately, naturally occurring <italic>F. tularensis</italic> strains can be treated with several antibiotics and no tendency to increased resistance has been observed (<xref ref-type="bibr" rid="B89">Tomaso et al., 2017</xref>).</p>
<p>The delineated origin of replication, the oriC, appears to be characteristic and unique for <italic>F. tularensis</italic> in general. The origin of replication was predicted in a region of approximately 100 bp upstream in 5&#x2032;-direction of 4 DnaA box sequences. Three methods, based on DNA asymmetry, the distribution of DnaA boxes and dnaA gene location, were applied to identify the putative single replication origin (oriC) in the genome of <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> strain 12T0050_FLI (<xref ref-type="bibr" rid="B51">Mackiewicz et al., 2004</xref>). Marker genes commonly observed near the bacterial origin of replication were found near the oriC region (chromosomal replication initiator protein DnaA CDS (CYL81_00005), priA gene (CYL81_009610), recA (CYL81_00060)). Two probable DNA-unwinding element (DUE) sites were identified within the shorter oriC region based on its higher A/T composition. Two DnaA boxes have the identical sequence TGTGGATAA and can be presented as a new DnaA box identifier in <italic>F. tularensis</italic> subsp. <italic>holarctica</italic>. Also, both DnaA boxes were predicted to be highly methylated at the motif GNNNNVNH by a hitherto unknown DNA-methyltransferase. This motif is similar to known 6mA methylation motifs such as tttAynnnnngtg from <italic>Clostridium perfringens</italic> or cyayyyyyyctc from <italic>Geopsychrobacter electrophilus</italic>. DNA-methylation without a restriction enzyme is quite common and conserved methylation patterns are evolutionarily stable, playing an important role in genome replication regulation (<xref ref-type="bibr" rid="B14">Blow et al., 2016</xref>). The organisms with the highest local similarity between sequences are <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> and <italic>F. tularensis</italic> subsp. <italic>tularensis</italic> as detected by megablast (<xref ref-type="bibr" rid="B57">Morgulis et al., 2008</xref>). 
The species with the next most similar sequences are <italic>Gilliamella apicola</italic> and <italic>Vibrio anguillarum</italic>, both belonging to the Gammaproteobacteria and isolated from bees and fish, respectively, with coverage of only 8&#x2013;17% of the regions and approximately 80% identity. This analysis provides insight into the high conservation of this region. This oriC is unique for the whole <italic>F. tularensis</italic> group. Also two probable DNA unwinding regions that are A/T rich could be identified in the oriC region (see also GC-skew in <bold>Figure <xref ref-type="fig" rid="F1">1</xref></bold>). The enrichment of methylated GATC motifs in the origin of replication indicates that DNA methylation may regulate genome replication in a manner similar to that seen in <italic>Escherichia coli</italic>. Interestingly, only the methylation motif VANDYAGYA could also be identified in the strain <italic>Enterococcus faecium</italic> isolate 2014-VREF-63 (REBASE (<xref ref-type="bibr" rid="B69">Roberts et al., 2015</xref>)).</p>
<p>In highly clonal species that share the bulk of their genomes (>95%), such as <italic>Francisella</italic>, subtle changes, especially those that may alter gene expression such as for example methylation, are likely to have a significant effect on the pathogen&#x2019;s biology (<xref ref-type="bibr" rid="B21">Champion, 2011</xref>). The methylation of <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> might also play a key role in the pathogenic stealth mechanisms of <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> in macrophages. We found that methylation is pervasive in <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> strain 12T0050_FLI as in most bacterial species. In total, 9 methylated motifs were identified, being in the normal range of motifs compared to 0&#x2013;19 methylated motifs per organism in 230 other prokaryotes (<xref ref-type="bibr" rid="B14">Blow et al., 2016</xref>). Of these motifs 10&#x2013;39% were methylated. The predominant base modification type detected was m6A in 2 cases; all others could not be identified. The identification of m6A methylated motifs is consistent with the high abundance of this modification type in the databases. They are also of special interest because m6A are known epigenetic signals for DNA-protein interactions (<xref ref-type="bibr" rid="B97">Wion and Casadesus, 2006</xref>). The other modifications, especially m5C, might be underestimated due to the lower sensitivity of SMRT sequencing to these modifications. At least two methyltransferases (MTases) are predicted to be able to perform m6A methylation. The predicted methylation sites are more highly methylated, but in most of them no known proteins were annotated. Most methylation sites belong to the Type I restriction modification system, which recognizes bipartite motifs and cleaves at large distances from its binding sites, or to orphan methylases. 
Incomplete methylation is typical for most orphan methylases that are suspected to play a major role in regulation of prokaryotic gene expression. This might indicate a methylation based prokaryotic gene expression in <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> being evolutionarily older than the assumed defense function of the restriction modification systems and which could be a reason for the genomic structure of <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> (<xref ref-type="bibr" rid="B14">Blow et al., 2016</xref>). In <italic>Escherichia coli</italic> the chromosome replication and nucleotide degradation is dependent on the methylation status of 11 GATC sites near the origin of replication (<italic>oriC</italic>), whereas hemimethylated origin sites are inactive. In <italic>Salmonella</italic>, a close relative of <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> and belonging also to the Gammaproteobacteria, the key control in pathogenic virulence is the regulation of virulence genes by methylation of a DAM methylase.</p>
<p>CpG island prediction was performed with standard settings of EMBOSS (<xref ref-type="bibr" rid="B67">Rice et al., 2000</xref>), resulting in 8 cpG islands of unusual CG composition. In addition to the methylation pattern, the cpG islands were analyzed. Eukaryotic DNA methylation is known to be specific for cytosines in cpG sequences. However, the protective function of DNA methylation is similar in eukaryotes and prokaryotes and it is proposed that cpG islands are associated with promoters that influence DNA replication and other functionalities (<xref ref-type="bibr" rid="B2">Antequera and Bird, 1999</xref>). Depending on the repetitive sequence, methylation can significantly enhance or reduce its genetic stability (<xref ref-type="bibr" rid="B61">Nichol and Pearson, 2002</xref>). Bacterial DNA from <italic>F. tularensis</italic> (LVS) containing unmethylated CpG motifs triggers an activation of B-cells, but no activation was triggered when the DNA was methylated (<xref ref-type="bibr" rid="B31">Elkins et al., 1999</xref>). Eight unusual cpG islands were predicted using EMBOSS (<xref ref-type="bibr" rid="B67">Rice et al., 2000</xref>) (see <bold>Supplementary Table <xref ref-type="supplementary-material" rid="SM3">S2</xref></bold>). The high methylation hints at a regulation which has to be explored by functional analysis. This regulative mechanism might help to evaluate the pathogenic pathways of <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> strain 12T0050 (<xref ref-type="bibr" rid="B31">Elkins et al., 1999</xref>).</p>
<p>To assess the phylogenetic origin of <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> strain 12T0050 we investigated 14 strains of the collection at the Friedrich-Loeffler-Institut. They were collected in the years 2009&#x2013;2015 in North Rhine-Westphalia, Germany, in the same region as isolate 12T0050 and were found up to 200 km apart. Whole genome sequencing with short sequences was performed. <italic>Francisella</italic> has a very difficult to assemble genome containing a repeat size of greater than 7 kbp (Class III) (<xref ref-type="bibr" rid="B45">Koren et al., 2013</xref>). Especially, the <italic>Francisella</italic> Pathogenicity Island that is reported to be duplicated in all the subspecies of <italic>F. tularensis</italic> (<italic>F. tularensis</italic> subsp. <italic>holarctica</italic>, <italic>tularensis</italic>, and <italic>mediasiatica</italic>) but is present using a single copy in <italic>F. novicida</italic> and <italic>F. philomiragia</italic> (<xref ref-type="bibr" rid="B15">Broms et al., 2010</xref>), is assembled into one contig using short sequence assemblers. With 12T0050_FLI, we were able to determine the currently best short-read assembly and annotation software. Although quality trimming and preprocessing with sickle was reported to reduce the transposon related artifacts as in Nextera XT kits from Illumina, in the preprocessing these seem to have only minor effects on the data set used here. Also bbduk, which is a tool for quality trimming and preprocessing, showed only minor effect. SPAdes in the Bayes Hammer mode without any further preprocessing was the method of choice for sequencer platforms. It is known that raw sequencing files contain contaminations (<xref ref-type="bibr" rid="B58">Mukherjee et al., 2015</xref>). A quality improvement was generated by excluding contigs that were smaller than 500 bp or with coverage lower than 3. 
Kraken analysis that was included into the workflow as a control for contamination and the analysis of the excluded contigs showed indeed a high percentage of contaminated sequences. The classification into the tree of life allows newly sequenced and unknown species to be classified correctly as was shown recently for new <italic>Francisella</italic> species (<xref ref-type="bibr" rid="B74">Rydzewski et al., 2014</xref>). Four protein annotation software were compared for analyzing the coding DNA sequences (CDS). The Prokka pipeline provided fast, easy and robust handling and could be easily curated with Artemis (<xref ref-type="bibr" rid="B19">Carver et al., 2012</xref>). The annotated content of 10 rRNA is the same as the previously published data of the complete genomes NC_007880 (LVS) and NC_008369 (OSU18), and is more reliable than the often misassembled rRNA annotations in short read assemblies. Thus, after SPAdes assembly, contig filtering and Kraken analysis, the Prokka annotation could easily be included. This pipeline was used as a uniform protocol for the here treated data. This was followed by phylogenetic analysis, starting with MOLE-BLAST and PhyloPhlAn to allow a classification into the phylogenetic tree of life and followed by closer epidemiological investigations using MLST<sup>+</sup> and Parsnp analysis.</p>
<p>To benchmark our whole genome comparisons with the prior literature, a phylogeny based on 16S rRNA gene sequences, historically the most frequently applied phylogenetic marker was generated with MOLE-BLAST (<xref ref-type="bibr" rid="B1">Altschul et al., 1997</xref>) that relies on the curated, updated and comprehensive database of NCBI. Thus, generated phylogenies allow newly sequenced organisms to be included in the tree of life using a broad data basis, as could be shown here in a tree including our dataset (<bold>Figure <xref ref-type="fig" rid="F3">3</xref></bold>). The coding sequences for the 16S rRNA could be extracted with geneious (<xref ref-type="bibr" rid="B42">Kearse et al., 2012</xref>) or MOLE-BLAST, which could be used with the assembled files. This consistently revealed only few differences between the <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> strains and clustered together all of our strains into the <italic>Francisella</italic> group. The 16S rRNA phylogeny allowed us a simple and fast classification to the genus, species, and subspecies level (data in <bold>Table <xref ref-type="table" rid="T1">1</xref></bold> and <xref ref-type="bibr" rid="B89">Tomaso et al., 2017</xref>).</p>
<p>For more profound characterization, we utilized PhyloPhlAn, which is a software tool for accurately determining taxonomic identities and evolutionary relationships of novel microbial genomes (<xref ref-type="bibr" rid="B79">Segata et al., 2013</xref>). Results from PhyloPhlAn are based on substantially more data compared to 16S rRNA or even the MLST<sup>+</sup> approach presented in <bold>Figure <xref ref-type="fig" rid="F4">4</xref></bold>. The program determines the protein sequence diversity and improves consistency between phylogenetic and taxonomic groupings. PhyloPhlAn achieves taxonomic levels of high precision from phyla to species level but also reflects a substantial number of provisional clades, as could be shown also here in the genus of <italic>Francisella</italic>. PhyloPhlAn was able to define distinct genotypes for <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> for representatives of all major subclades, B.4, B.6, and B.12, respectively. The results of MOLE-BLAST and PhyloPhlAn are in good concordance with the data from MALDI-TOF and PCR and with all the results of conventional typing methods.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption><p>MLST<sup>+</sup> of the strains showing the distance based on 1147 core genome MLST loci generated with SeqSphere. The graphic scale equals 0.1 difference of an MLST locus. Red colored isolate numbers indicate assignment to clade B.6, blue to clade B.12. The arrow marks the position of 12T0050.</p></caption>
<graphic xlink:href="fmicb-09-00344-g004.tif"/>
</fig>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption><p>Neighbor-Joining Phylogenetic Tree of the ParSNP core genome SNP analysis <bold>(A)</bold>. The trees were statistically evaluated with RAxML using a bootstrap analysis with 500 replicates (<bold>B</bold> and detailed view <bold>C</bold>, compared to canSNPer analysis).</p></caption>
<graphic xlink:href="fmicb-09-00344-g005.tif"/>
</fig>
<p>To perform a more detailed epidemiological analysis the core genome based MLST<sup>+</sup> method of SeqSphere (<xref ref-type="bibr" rid="B3">Antwerpen et al., 2015</xref>) and the core-genome multi-aligner Parsnp of the Harvest suite were compared (<xref ref-type="bibr" rid="B91">Treangen et al., 2014</xref>). Canonical single nucleotide polymorphisms (canSNPs) assays (qPCR and canSNPer) and MLST<sup>+</sup> distinct clusters of genotypes allowed to identify phylogeographic patterns of <italic>F. tularensis</italic> (<xref ref-type="bibr" rid="B65">Pilo et al., 2009</xref>; <xref ref-type="bibr" rid="B85">Svensson et al., 2009</xref>; <xref ref-type="bibr" rid="B94">Vogler et al., 2009</xref>, <xref ref-type="bibr" rid="B95">2011</xref>; <xref ref-type="bibr" rid="B23">Chanturia et al., 2011</xref>; <xref ref-type="bibr" rid="B36">Gyuranecz et al., 2012</xref>; <xref ref-type="bibr" rid="B41">Karlsson et al., 2013</xref>; <xref ref-type="bibr" rid="B3">Antwerpen et al., 2015</xref>).</p>
<p>The MLST<sup>+</sup> tree analysis is based on whole genome sequencing, core genome SNP calling, and defined 1147 MLST loci. The application of MLST<sup>+</sup> revealed two different genotypes with different degrees of relatedness among the investigated isolates. This was in line with laboratory qPCR data (see <bold>Table <xref ref-type="table" rid="T1">1</xref></bold>). Isolate 15T0016 was forming an outgroup. The assignment to genetic clades was nearly identical to results obtained with real-time PCR assays targeting canSNPs and INDELs, but no spatial and temporal clusters could be shown.</p>
<p>Finally, Parsnp analysis was performed. When using genomic variants for phylogenetic analysis, comparative genomics, or outbreak investigations, it is critical to properly evaluate the variant calling method and also to re-evaluate them on a regular basis (<xref ref-type="bibr" rid="B62">Olson et al., 2015</xref>). With a growing number of genome sequences the multiple alignments of homologous sequences followed by inference of a tree scale poorly. Therefore, independent &#x2018;alignment-free&#x2019; methods should be preferably used (<xref ref-type="bibr" rid="B22">Chan and Ragan, 2013</xref>). Parsnp combines the advantages of both whole-genome alignment and read mapping. Parsnp scales to thousands of closely related genomes. To achieve this scalability, Parsnp is based on a suffix graph data structure for the rapid identification of maximal unique matches (MUMs), which serve as a common foundation to many pairwise and multiple genome alignment tools (<xref ref-type="bibr" rid="B91">Treangen et al., 2014</xref>). Subsequently, the Harvest suite for rapid core-genome alignment was used. For the alignment, a maximum likelihood tree with the GTRGAMMA model of rate heterogeneity was calculated with RAxML (<xref ref-type="bibr" rid="B83">Stamatakis, 2014</xref>) and supported by a bootstrapping test with 500 resamples. This method provided the highest resolution and was mostly congruent with the qPCR and canSNPer results. The groups B.11, B.45, B.49, B.51, and B.64 were identified.</p>
<p>Here, only random temporal and spatial distribution patterns can be described due to the small sample number. But we could achieve a more detailed differentiation, for example for the three strains 12T0062, 15T0013 and 15T0014. The fact that the strain 12T0062 clustered together with 15T0013 and 15T0014 was interesting because the canSNPer clustered them together. This phylogenetic clustering will be more precise because more data points are included. Isolate 12T0062 was placed on a separate branch in the MLST<sup>+</sup> and the PhyloPhlAn trees, and had an older common ancestor in the Parsnp/RAxML tree, whereas it was assigned to a branch by the typing methods based on the canSNPer approach. Also, at this closer resolution, the strains 10T0193, 09T0179, 12T0050 and 10T0192, which fall into one cluster in the canSNPer and qPCR analyses, form a much more diverse group in this analysis.</p>
<p>There is a need for an automated approach based on whole genome sequencing data. The pipeline described here is independent of a reference genome and allows analysis on varying sampling sizes, thus meeting the need of phylogenomics. A bioinformatics pipeline consisting of SPAdes, Prokka, PhyloPhlAn and Parsnp was evaluated here. While the study contains relatively few strains taken from a small area, it bears the powerful option to directly broaden the impact by inclusion of data from other countries. It also opens up the option to consider host-specific differences. This higher resolution can result in a more detailed view of epidemiology, including the phylogenetic aspect. The broader data basis for our placements compared to the canSNPer or MLST<sup>+</sup> models allows reclassifying diverged clades by high-resolution protein sequence analysis and more nucleotide sequence variations. An advantage of the pipeline approach described here is that it is congruent with the qPCR approach but leads to a higher resolution. Thus, whole genome sequencing can be used for rapid routine analysis in the future. When used with more isolates it might be even possible to establish a higher spatial and temporal resolution and thus to generate a highly standardized nomenclature for subpopulations. Besides, with relatively minor genetic differences found in the genomic analysis, <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> isolate 12T0050 is highly conserved among the collected strains. <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> strains investigated here showed only very low genetic evolution in the observation period. This is especially evident with a sequence comparison to NC_009749 that had been isolated more than 20 years ago (1997) and is geographically more than 1000 km away. To assess the evolution of <italic>F. tularensis</italic> subsp. 
<italic>holarctica</italic> we calculated the rates of molecular evolution that are the product of the number of mutations that arise per replication event, the frequency of replication events per unit time and the probability of mutational fixation (<xref ref-type="bibr" rid="B29">Duchene et al., 2016</xref>). The regression slope (rate) found here included negative values, suggesting that these rates are either too low or not enough with the here used data set to allow reliable rate estimation (data not shown). Similar data are obtained from <italic>Mycobacterium leprae</italic> relying on a set displaying moderate to strong temporal signal (<xref ref-type="bibr" rid="B29">Duchene et al., 2016</xref>). This indicates that <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> is a highly specialized and successful pathogen whose evolution might have reached a dead end such as in <italic>Clostridium chauvoei</italic> (<xref ref-type="bibr" rid="B73">Rychener et al., 2017</xref>). Genomics of <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> strain 12T0050 and comparative genomics with other <italic>Francisella</italic> show a remarkable similarity in gene content despite the ecological and phenotypic diversity.</p>
</sec>
<sec><title>Conclusion</title>
<p>Here we introduce a high quality sequence of a <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> strain. This genome presents a unique oriC sequence, interesting Cas9 regions, prophage regions and a so far unknown methylation pattern. Additionally, we evaluated and established an analysis pipeline for <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> in Germany. We performed phylogenetic analysis on different levels, thereby linking existing 16S rRNA data with PhyloPhlAn and core genome SNP analysis with MLST<sup>+</sup> and Parsnp. These methods to assign microbial phylogeny and putative taxonomy using proteins (PhyloPhlAn) and SNPs (Parsnp) proved to be versatile in the epidemiological assessment of <italic>F. tularensis</italic> subsp. <italic>holarctica</italic> in North Rhine-Westphalia, Germany. A diagnostic whole genome sequencing pipeline was established and evaluated. This novel analysis allows a detailed classification, a very precise placement and the utilization of readily available whole genome data, independent of databases and reference genomes.</p>
</sec>
<sec><title>Author Contributions</title>
<p>HT has conceived the study, provided strains, strain information, and metadata to the samples. AB performed bioinformatics analysis of genomes, assembly and phylogenetic relationship. PT took part in the phylogenetic relationship analysis. PT and EZ provided bioinformatics, informatics support and data management. MP provided isolates and geographic information. HB, KN, and JG provided knowledgeable discussion and inclusion on bioinformatics pipelines within the framework of the project Ess-B.A.R. HT, SAD, HH, and HN took part in the study design and project discussion.</p>
</sec>
<sec><title>Conflict of Interest Statement</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
</body>
<back>
<fn-group>
<fn fn-type="financial-disclosure">
<p><bold>Funding.</bold> For this work AB was supported by a grant of the German Federal Ministry of Education and Research and was done within the framework of the project Ess-B.A.R. (FKZ 13N13983), as was HB (FKZ 13N13982), JG (FKZ 13N13982), and KN (FKZ 13N13984). PT was supported by ICAR International Fellowship. EZ was supported by a grant of the Friedrich-Loeffler-Institut, Antimicrobial Resistance&#x2013;Research Network T3 (HJ-002).</p>
</fn>
</fn-group>
<ack>
<p>We thank Kerstin Cerncic and Anja Hackbart for skillful technical assistance. We thank Robert Greither and Alessandro Albiero of Thermo Fisher Scientific for Ion Torrent sequencing and primary data analysis. We are also very grateful to Boyke Bunk for supplying the bioinformatics tool for sequence error correction of the hybrid assembly. Last but not least, we are immensely grateful to all people that provided samples and isolates.</p>
</ack>
<sec sec-type="supplementary material">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fmicb.2018.00344/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fmicb.2018.00344/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Presentation_1.pptx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.presentationml.presentation" xmlns:xlink="http://www.w3.org/1999/xlink">
<p><bold>FIGURE S1 &#x007C;</bold> Bioinformatics pipeline.</p>
</supplementary-material>
<supplementary-material xlink:href="Table_1.docx" id="SM2" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink">
<p><bold>TABLE S1 &#x007C;</bold> Comparison of assembler preprocessing with bbduk and sickle and assembler comparison of the 12T0050 assembly with SPAdes, ABySS, MaSuRCA and CLC.</p>
</supplementary-material>
<supplementary-material xlink:href="Table_2.docx" id="SM3" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink">
<p><bold>TABLE S2 &#x007C;</bold> Predicted CpG islands with number of methylated sites and methylation percentage. CpG island prediction was performed with standard settings of EMBOSS. With an average methylation percentage of 12&#x2013;40%, the predicted methylation sites are significantly methylated, but for most of them no known proteins were annotated.</p>
</supplementary-material>
</sec>
<ref-list>
<title>References</title>
<ref id="B1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Altschul</surname> <given-names>S. F.</given-names></name> <name><surname>Madden</surname> <given-names>T. L.</given-names></name> <name><surname>Sch&#x00E4;ffer</surname> <given-names>A. A.</given-names></name> <name><surname>Zhang</surname> <given-names>J.</given-names></name> <name><surname>Zhang</surname> <given-names>Z.</given-names></name> <name><surname>Miller</surname> <given-names>W.</given-names></name></person-group> (<year>1997</year>). <article-title>Gapped BLAST and PSI-BLAST: a new generation of protein database search programs.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>25</volume> <fpage>3389</fpage>&#x2013;<lpage>3402</lpage>. <pub-id pub-id-type="doi">10.1093/nar/25.17.3389</pub-id> <pub-id pub-id-type="pmid">9254694</pub-id></citation></ref>
<ref id="B2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Antequera</surname> <given-names>F.</given-names></name> <name><surname>Bird</surname> <given-names>A.</given-names></name></person-group> (<year>1999</year>). <article-title>CpG islands as genomic footprints of promoters that are associated with replication origins.</article-title> <source><italic>Curr. Biol.</italic></source> <volume>9</volume> <fpage>R661</fpage>&#x2013;<lpage>R667</lpage>. <pub-id pub-id-type="doi">10.1016/S0960-9822(99)80418-7</pub-id> <pub-id pub-id-type="pmid">10508580</pub-id></citation></ref>
<ref id="B3"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Antwerpen</surname> <given-names>M. H.</given-names></name> <name><surname>Prior</surname> <given-names>K.</given-names></name> <name><surname>Mellmann</surname> <given-names>A.</given-names></name> <name><surname>Hoppner</surname> <given-names>S.</given-names></name> <name><surname>Splettstoesser</surname> <given-names>W. D.</given-names></name> <name><surname>Harmsen</surname> <given-names>D.</given-names></name></person-group> (<year>2015</year>). <article-title>Rapid high resolution genotyping of <italic>Francisella tularensis</italic> by whole genome sequence comparison of annotated genes (&#x201C;MLST<sup>+</sup>&#x201D;).</article-title> <source><italic>PLoS One</italic></source> <volume>10</volume>:<issue>e0123298</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0123298</pub-id> <pub-id pub-id-type="pmid">25856198</pub-id></citation></ref>
<ref id="B4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Antwerpen</surname> <given-names>M. H.</given-names></name> <name><surname>Schacht</surname> <given-names>E.</given-names></name> <name><surname>Kaysser</surname> <given-names>P.</given-names></name> <name><surname>Splettstoesser</surname> <given-names>W. D.</given-names></name></person-group> (<year>2013</year>). <article-title>Complete genome sequence of a <italic>Francisella tularensis</italic> subsp. <italic>holarctica</italic> strain from Germany causing lethal infection in common marmosets.</article-title> <source><italic>Genome Announc.</italic></source> <volume>1</volume>:<issue>e00135</issue>&#x2013;<issue>12</issue>. <pub-id pub-id-type="doi">10.1128/genomeA.00135-12</pub-id> <pub-id pub-id-type="pmid">23405342</pub-id></citation></ref>
<ref id="B5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Atkins</surname> <given-names>L. M.</given-names></name> <name><surname>Holder</surname> <given-names>M. E.</given-names></name> <name><surname>Ajami</surname> <given-names>N. J.</given-names></name> <name><surname>Metcalf</surname> <given-names>G. A.</given-names></name> <name><surname>Weissenberger</surname> <given-names>G. M.</given-names></name> <name><surname>Wang</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>High-quality draft genome sequence of <italic>Francisella tularensis</italic> subsp. <italic>holarctica</italic> strain OR96-0246.</article-title> <source><italic>Genome Announc.</italic></source> <volume>3</volume>:<issue>e00898</issue>&#x2013;<issue>15</issue>. <pub-id pub-id-type="doi">10.1128/genomeA.00898-15</pub-id> <pub-id pub-id-type="pmid">26272574</pub-id></citation></ref>
<ref id="B6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Aziz</surname> <given-names>R. K.</given-names></name> <name><surname>Bartels</surname> <given-names>D.</given-names></name> <name><surname>Best</surname> <given-names>A. A.</given-names></name> <name><surname>Dejongh</surname> <given-names>M.</given-names></name> <name><surname>Disz</surname> <given-names>T.</given-names></name> <name><surname>Edwards</surname> <given-names>R. A.</given-names></name><etal/></person-group> (<year>2008</year>). <article-title>The RAST Server: rapid annotations using subsystems technology.</article-title> <source><italic>BMC Genomics</italic></source> <volume>9</volume>:<issue>75</issue>. <pub-id pub-id-type="doi">10.1186/1471-2164-9-75</pub-id> <pub-id pub-id-type="pmid">18261238</pub-id></citation></ref>
<ref id="B7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bankevich</surname> <given-names>A.</given-names></name> <name><surname>Nurk</surname> <given-names>S.</given-names></name> <name><surname>Antipov</surname> <given-names>D.</given-names></name> <name><surname>Gurevich</surname> <given-names>A. A.</given-names></name> <name><surname>Dvorkin</surname> <given-names>M.</given-names></name> <name><surname>Kulikov</surname> <given-names>A. S.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>SPAdes: a new genome assembly algorithm and its applications to single-cell sequencing.</article-title> <source><italic>J. Comput. Biol.</italic></source> <volume>19</volume> <fpage>455</fpage>&#x2013;<lpage>477</lpage>. <pub-id pub-id-type="doi">10.1089/cmb.2012.0021</pub-id> <pub-id pub-id-type="pmid">22506599</pub-id></citation></ref>
<ref id="B8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Barabote</surname> <given-names>R. D.</given-names></name> <name><surname>Xie</surname> <given-names>G.</given-names></name> <name><surname>Brettin</surname> <given-names>T. S.</given-names></name> <name><surname>Hinrichs</surname> <given-names>S. H.</given-names></name> <name><surname>Fey</surname> <given-names>P. D.</given-names></name> <name><surname>Jay</surname> <given-names>J. J.</given-names></name><etal/></person-group> (<year>2009</year>). <article-title>Complete genome sequence of <italic>Francisella tularensis</italic> subspecies <italic>holarctica</italic> FTNF002-00.</article-title> <source><italic>PLoS One</italic></source> <volume>4</volume>:<issue>e7041</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0007041</pub-id> <pub-id pub-id-type="pmid">19756146</pub-id></citation></ref>
<ref id="B9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Barker</surname> <given-names>J. R.</given-names></name> <name><surname>Chong</surname> <given-names>A.</given-names></name> <name><surname>Wehrly</surname> <given-names>T. D.</given-names></name> <name><surname>Yu</surname> <given-names>J. J.</given-names></name> <name><surname>Rodriguez</surname> <given-names>S. A.</given-names></name> <name><surname>Liu</surname> <given-names>J.</given-names></name><etal/></person-group> (<year>2009</year>). <article-title>The <italic>Francisella tularensis</italic> pathogenicity island encodes a secretion system that is required for phagosome escape and virulence.</article-title> <source><italic>Mol. Microbiol.</italic></source> <volume>74</volume> <fpage>1459</fpage>&#x2013;<lpage>1470</lpage>. <pub-id pub-id-type="doi">10.1111/j.1365-2958.2009.06947.x</pub-id></citation></ref>
<ref id="B10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Barrangou</surname> <given-names>R.</given-names></name> <name><surname>Fremaux</surname> <given-names>C.</given-names></name> <name><surname>Deveau</surname> <given-names>H.</given-names></name> <name><surname>Richards</surname> <given-names>M.</given-names></name> <name><surname>Boyaval</surname> <given-names>P.</given-names></name> <name><surname>Moineau</surname> <given-names>S.</given-names></name><etal/></person-group> (<year>2007</year>). <article-title>CRISPR provides acquired resistance against viruses in prokaryotes.</article-title> <source><italic>Science</italic></source> <volume>315</volume> <fpage>1709</fpage>&#x2013;<lpage>1712</lpage>. <pub-id pub-id-type="doi">10.1126/science.1138140</pub-id> <pub-id pub-id-type="pmid">17379808</pub-id></citation></ref>
<ref id="B11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Beckstrom-Sternberg</surname> <given-names>S. M.</given-names></name> <name><surname>Auerbach</surname> <given-names>R. K.</given-names></name> <name><surname>Godbole</surname> <given-names>S.</given-names></name> <name><surname>Pearson</surname> <given-names>J. V.</given-names></name> <name><surname>Beckstrom-Sternberg</surname> <given-names>J. S.</given-names></name> <name><surname>Deng</surname> <given-names>Z.</given-names></name><etal/></person-group> (<year>2007</year>). <article-title>Complete genomic characterization of a pathogenic A.II strain of <italic>Francisella tularensis</italic> subspecies <italic>tularensis</italic>.</article-title> <source><italic>PLoS One</italic></source> <volume>2</volume>:<issue>e947</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0000947</pub-id> <pub-id pub-id-type="pmid">17895988</pub-id></citation></ref>
<ref id="B12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Benson</surname> <given-names>G.</given-names></name></person-group> (<year>1999</year>). <article-title>Tandem repeats finder: a program to analyze DNA sequences.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>27</volume> <fpage>573</fpage>&#x2013;<lpage>580</lpage>. <pub-id pub-id-type="doi">10.1093/nar/27.2.573</pub-id> <pub-id pub-id-type="pmid">9862982</pub-id></citation></ref>
<ref id="B13"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bland</surname> <given-names>C.</given-names></name> <name><surname>Ramsey</surname> <given-names>T. L.</given-names></name> <name><surname>Sabree</surname> <given-names>F.</given-names></name> <name><surname>Lowe</surname> <given-names>M.</given-names></name> <name><surname>Brown</surname> <given-names>K.</given-names></name> <name><surname>Kyrpides</surname> <given-names>N. C.</given-names></name><etal/></person-group> (<year>2007</year>). <article-title>CRISPR recognition tool (CRT): a tool for automatic detection of clustered regularly interspaced palindromic repeats.</article-title> <source><italic>BMC Bioinformatics</italic></source> <volume>8</volume>:<issue>209</issue>. <pub-id pub-id-type="doi">10.1186/1471-2105-8-209</pub-id> <pub-id pub-id-type="pmid">17577412</pub-id></citation></ref>
<ref id="B14"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Blow</surname> <given-names>M. J.</given-names></name> <name><surname>Clark</surname> <given-names>T. A.</given-names></name> <name><surname>Daum</surname> <given-names>C. G.</given-names></name> <name><surname>Deutschbauer</surname> <given-names>A. M.</given-names></name> <name><surname>Fomenkov</surname> <given-names>A.</given-names></name> <name><surname>Fries</surname> <given-names>R.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>The epigenomic landscape of prokaryotes.</article-title> <source><italic>PLoS Genet.</italic></source> <volume>12</volume>:<issue>e1005854</issue>. <pub-id pub-id-type="doi">10.1371/journal.pgen.1005854</pub-id> <pub-id pub-id-type="pmid">27171000</pub-id></citation></ref>
<ref id="B15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Broms</surname> <given-names>J. E.</given-names></name> <name><surname>Sjostedt</surname> <given-names>A.</given-names></name> <name><surname>Lavander</surname> <given-names>M.</given-names></name></person-group> (<year>2010</year>). <article-title>The role of the <italic>Francisella tularensis</italic> pathogenicity island in type VI secretion, intracellular survival, and modulation of host cell signaling.</article-title> <source><italic>Front. Microbiol.</italic></source> <volume>1</volume>:<issue>136</issue>. <pub-id pub-id-type="doi">10.3389/fmicb.2010.00136</pub-id> <pub-id pub-id-type="pmid">21687753</pub-id></citation></ref>
<ref id="B16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Busch</surname> <given-names>A.</given-names></name> <name><surname>Thomas</surname> <given-names>P.</given-names></name> <name><surname>Myrtennas</surname> <given-names>K.</given-names></name> <name><surname>Forsman</surname> <given-names>M.</given-names></name> <name><surname>Braune</surname> <given-names>S.</given-names></name> <name><surname>Runge</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>High-quality draft genome sequence of <italic>Francisella tularensis</italic> subsp. <italic>holarctica</italic> strain 08t0073 isolated from a Wild European Hare.</article-title> <source><italic>Genome Announc.</italic></source> <volume>5</volume>:<issue>e01577</issue>&#x2013;<issue>16</issue>. <pub-id pub-id-type="doi">10.1128/genomeA.01577-16</pub-id> <pub-id pub-id-type="pmid">28336603</pub-id></citation></ref>
<ref id="B17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bushnell</surname> <given-names>B.</given-names></name></person-group> (<year>2017</year>). <source><italic>BBMap Software Package.</italic></source> Available at: <ext-link ext-link-type="uri" xlink:href="http://sourceforge.net/projects/bbmap/">http://sourceforge.net/projects/bbmap/</ext-link></citation></ref>
<ref id="B18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Canchaya</surname> <given-names>C.</given-names></name> <name><surname>Fournous</surname> <given-names>G.</given-names></name> <name><surname>Chibani-Chennoufi</surname> <given-names>S.</given-names></name> <name><surname>Dillmann</surname> <given-names>M. L.</given-names></name> <name><surname>Brussow</surname> <given-names>H.</given-names></name></person-group> (<year>2003</year>). <article-title>Phage as agents of lateral gene transfer.</article-title> <source><italic>Curr. Opin. Microbiol.</italic></source> <volume>6</volume> <fpage>417</fpage>&#x2013;<lpage>424</lpage>. <pub-id pub-id-type="doi">10.1016/S1369-5274(03)00086-9</pub-id></citation></ref>
<ref id="B19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Carver</surname> <given-names>T.</given-names></name> <name><surname>Harris</surname> <given-names>S. R.</given-names></name> <name><surname>Berriman</surname> <given-names>M.</given-names></name> <name><surname>Parkhill</surname> <given-names>J.</given-names></name> <name><surname>Mcquillan</surname> <given-names>J. A.</given-names></name></person-group> (<year>2012</year>). <article-title>Artemis: an integrated platform for visualization and analysis of high-throughput sequence-based experimental data.</article-title> <source><italic>Bioinformatics</italic></source> <volume>28</volume> <fpage>464</fpage>&#x2013;<lpage>469</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btr703</pub-id> <pub-id pub-id-type="pmid">22199388</pub-id></citation></ref>
<ref id="B20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Carver</surname> <given-names>T.</given-names></name> <name><surname>Thomson</surname> <given-names>N.</given-names></name> <name><surname>Bleasby</surname> <given-names>A.</given-names></name> <name><surname>Berriman</surname> <given-names>M.</given-names></name> <name><surname>Parkhill</surname> <given-names>J.</given-names></name></person-group> (<year>2009</year>). <article-title>DNAPlotter: circular and linear interactive genome visualization.</article-title> <source><italic>Bioinformatics</italic></source> <volume>25</volume> <fpage>119</fpage>&#x2013;<lpage>120</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btn578</pub-id> <pub-id pub-id-type="pmid">18990721</pub-id></citation></ref>
<ref id="B21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Champion</surname> <given-names>M. D.</given-names></name></person-group> (<year>2011</year>). <article-title>Host-pathogen O-methyltransferase similarity and its specific presence in highly virulent strains of <italic>Francisella tularensis</italic> suggests molecular mimicry.</article-title> <source><italic>PLoS One</italic></source> <volume>6</volume>:<issue>e20295</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0020295</pub-id> <pub-id pub-id-type="pmid">21637805</pub-id></citation></ref>
<ref id="B22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chan</surname> <given-names>C. X.</given-names></name> <name><surname>Ragan</surname> <given-names>M. A.</given-names></name></person-group> (<year>2013</year>). <article-title>Next-generation phylogenomics.</article-title> <source><italic>Biol. Direct</italic></source> <volume>8</volume>:<issue>3</issue>. <pub-id pub-id-type="doi">10.1186/1745-6150-8-3</pub-id> <pub-id pub-id-type="pmid">23339707</pub-id></citation></ref>
<ref id="B23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chanturia</surname> <given-names>G.</given-names></name> <name><surname>Birdsell</surname> <given-names>D. N.</given-names></name> <name><surname>Kekelidze</surname> <given-names>M.</given-names></name> <name><surname>Zhgenti</surname> <given-names>E.</given-names></name> <name><surname>Babuadze</surname> <given-names>G.</given-names></name> <name><surname>Tsertsvadze</surname> <given-names>N.</given-names></name><etal/></person-group> (<year>2011</year>). <article-title>Phylogeography of <italic>Francisella tularensis</italic> subspecies <italic>holarctica</italic> from the country of Georgia.</article-title> <source><italic>BMC Microbiol.</italic></source> <volume>11</volume>:<issue>139</issue>. <pub-id pub-id-type="doi">10.1186/1471-2180-11-139</pub-id> <pub-id pub-id-type="pmid">21682874</pub-id></citation></ref>
<ref id="B24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chaudhuri</surname> <given-names>R. R.</given-names></name> <name><surname>Ren</surname> <given-names>C. P.</given-names></name> <name><surname>Desmond</surname> <given-names>L.</given-names></name> <name><surname>Vincent</surname> <given-names>G. A.</given-names></name> <name><surname>Silman</surname> <given-names>N. J.</given-names></name> <name><surname>Brehm</surname> <given-names>J. K.</given-names></name><etal/></person-group> (<year>2007</year>). <article-title>Genome sequencing shows that European isolates of <italic>Francisella tularensis</italic> subspecies <italic>tularensis</italic> are almost identical to US laboratory strain Schu S4.</article-title> <source><italic>PLoS One</italic></source> <volume>2</volume>:<issue>e352</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0000352</pub-id> <pub-id pub-id-type="pmid">17406676</pub-id></citation></ref>
<ref id="B25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chin</surname> <given-names>C. S.</given-names></name> <name><surname>Alexander</surname> <given-names>D. H.</given-names></name> <name><surname>Marks</surname> <given-names>P.</given-names></name> <name><surname>Klammer</surname> <given-names>A. A.</given-names></name> <name><surname>Drake</surname> <given-names>J.</given-names></name> <name><surname>Heiner</surname> <given-names>C.</given-names></name><etal/></person-group> (<year>2013</year>). <article-title>Nonhybrid, finished microbial genome assemblies from long-read SMRT sequencing data.</article-title> <source><italic>Nat. Methods</italic></source> <volume>10</volume> <fpage>563</fpage>&#x2013;<lpage>569</lpage>. <pub-id pub-id-type="doi">10.1038/nmeth.2474</pub-id> <pub-id pub-id-type="pmid">23644548</pub-id></citation></ref>
<ref id="B26"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>de Bruin</surname> <given-names>O. M.</given-names></name> <name><surname>Duplantis</surname> <given-names>B. N.</given-names></name> <name><surname>Ludu</surname> <given-names>J. S.</given-names></name> <name><surname>Hare</surname> <given-names>R. F.</given-names></name> <name><surname>Nix</surname> <given-names>E. B.</given-names></name> <name><surname>Schmerk</surname> <given-names>C. L.</given-names></name><etal/></person-group> (<year>2011</year>). <article-title>The biochemical properties of the <italic>Francisella</italic> pathogenicity island (FPI)-encoded proteins IglA, IglB, IglC, PdpB and DotU suggest roles in type VI secretion.</article-title> <source><italic>Microbiology</italic></source> <volume>157</volume> <fpage>3483</fpage>&#x2013;<lpage>3491</lpage>. <pub-id pub-id-type="doi">10.1099/mic.0.052308-0</pub-id> <pub-id pub-id-type="pmid">21980115</pub-id></citation></ref>
<ref id="B27"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Delcher</surname> <given-names>A. L.</given-names></name> <name><surname>Bratke</surname> <given-names>K. A.</given-names></name> <name><surname>Powers</surname> <given-names>E. C.</given-names></name> <name><surname>Salzberg</surname> <given-names>S. L.</given-names></name></person-group> (<year>2007</year>). <article-title>Identifying bacterial genes and endosymbiont DNA with Glimmer.</article-title> <source><italic>Bioinformatics</italic></source> <volume>23</volume> <fpage>673</fpage>&#x2013;<lpage>679</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btm009</pub-id> <pub-id pub-id-type="pmid">17237039</pub-id></citation></ref>
<ref id="B28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Delcher</surname> <given-names>A. L.</given-names></name> <name><surname>Harmon</surname> <given-names>D.</given-names></name> <name><surname>Kasif</surname> <given-names>S.</given-names></name> <name><surname>White</surname> <given-names>O.</given-names></name> <name><surname>Salzberg</surname> <given-names>S. L.</given-names></name></person-group> (<year>1999</year>). <article-title>Improved microbial gene identification with GLIMMER.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>27</volume> <fpage>4636</fpage>&#x2013;<lpage>4641</lpage>. <pub-id pub-id-type="doi">10.1093/nar/27.23.4636</pub-id> <pub-id pub-id-type="pmid">10556321</pub-id></citation></ref>
<ref id="B29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Duchene</surname> <given-names>S.</given-names></name> <name><surname>Holt</surname> <given-names>K. E.</given-names></name> <name><surname>Weill</surname> <given-names>F. X.</given-names></name> <name><surname>Le Hello</surname> <given-names>S.</given-names></name> <name><surname>Hawkey</surname> <given-names>J.</given-names></name> <name><surname>Edwards</surname> <given-names>D. J.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>Genome-scale rates of evolutionary change in bacteria.</article-title> <source><italic>Microb. Genomics</italic></source> <volume>2</volume>:<issue>e000094</issue>. <pub-id pub-id-type="doi">10.1099/mgen.0.000094</pub-id> <pub-id pub-id-type="pmid">28348834</pub-id></citation></ref>
<ref id="B30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Edgar</surname> <given-names>R. C.</given-names></name></person-group> (<year>2004</year>). <article-title>MUSCLE: a multiple sequence alignment method with reduced time and space complexity.</article-title> <source><italic>BMC Bioinformatics</italic></source> <volume>5</volume>:<issue>113</issue>. <pub-id pub-id-type="doi">10.1186/1471-2105-5-113</pub-id> <pub-id pub-id-type="pmid">15318951</pub-id></citation></ref>
<ref id="B31"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Elkins</surname> <given-names>K. L.</given-names></name> <name><surname>Rhinehart-Jones</surname> <given-names>T. R.</given-names></name> <name><surname>Stibitz</surname> <given-names>S.</given-names></name> <name><surname>Conover</surname> <given-names>J. S.</given-names></name> <name><surname>Klinman</surname> <given-names>D. M.</given-names></name></person-group> (<year>1999</year>). <article-title>Bacterial DNA containing CpG motifs stimulates lymphocyte-dependent protection of mice against lethal infection with intracellular bacteria.</article-title> <source><italic>J. Immunol.</italic></source> <volume>162</volume> <fpage>2291</fpage>&#x2013;<lpage>2298</lpage>. <pub-id pub-id-type="pmid">9973506</pub-id></citation></ref>
<ref id="B32"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ellis</surname> <given-names>J.</given-names></name> <name><surname>Oyston</surname> <given-names>P. C.</given-names></name> <name><surname>Green</surname> <given-names>M.</given-names></name> <name><surname>Titball</surname> <given-names>R. W.</given-names></name></person-group> (<year>2002</year>). <article-title>Tularemia.</article-title> <source><italic>Clin. Microbiol. Rev.</italic></source> <volume>15</volume> <fpage>631</fpage>&#x2013;<lpage>646</lpage>. <pub-id pub-id-type="doi">10.1128/CMR.15.4.631-646.2002</pub-id></citation></ref>
<ref id="B33"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gao</surname> <given-names>F.</given-names></name> <name><surname>Zhang</surname> <given-names>C. T.</given-names></name></person-group> (<year>2008</year>). <article-title>Ori-Finder: a web-based system for finding oriCs in unannotated bacterial genomes.</article-title> <source><italic>BMC Bioinformatics</italic></source> <volume>9</volume>:<issue>79</issue>. <pub-id pub-id-type="doi">10.1186/1471-2105-9-79</pub-id> <pub-id pub-id-type="pmid">18237442</pub-id></citation></ref>
<ref id="B34"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Golkar</surname> <given-names>Z.</given-names></name> <name><surname>Bagasra</surname> <given-names>O.</given-names></name> <name><surname>Pace</surname> <given-names>D. G.</given-names></name></person-group> (<year>2014</year>). <article-title>Bacteriophage therapy: a potential solution for the antibiotic resistance crisis.</article-title> <source><italic>J. Infect. Dev. Ctries.</italic></source> <volume>8</volume> <fpage>129</fpage>&#x2013;<lpage>136</lpage>. <pub-id pub-id-type="doi">10.3855/jidc.3573</pub-id> <pub-id pub-id-type="pmid">24518621</pub-id></citation></ref>
<ref id="B35"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gurevich</surname> <given-names>A.</given-names></name> <name><surname>Saveliev</surname> <given-names>V.</given-names></name> <name><surname>Vyahhi</surname> <given-names>N.</given-names></name> <name><surname>Tesler</surname> <given-names>G.</given-names></name></person-group> (<year>2013</year>). <article-title>QUAST: quality assessment tool for genome assemblies.</article-title> <source><italic>Bioinformatics</italic></source> <volume>29</volume> <fpage>1072</fpage>&#x2013;<lpage>1075</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btt086</pub-id> <pub-id pub-id-type="pmid">23422339</pub-id></citation></ref>
<ref id="B36"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gyuranecz</surname> <given-names>M.</given-names></name> <name><surname>Birdsell</surname> <given-names>D. N.</given-names></name> <name><surname>Splettstoesser</surname> <given-names>W.</given-names></name> <name><surname>Seibold</surname> <given-names>E.</given-names></name> <name><surname>Beckstrom-Sternberg</surname> <given-names>S. M.</given-names></name> <name><surname>Makrai</surname> <given-names>L.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>Phylogeography of <italic>Francisella tularensis</italic> subsp. <italic>holarctica</italic>, Europe.</article-title> <source><italic>Emerg. Infect. Dis.</italic></source> <volume>18</volume> <fpage>290</fpage>&#x2013;<lpage>293</lpage>. <pub-id pub-id-type="doi">10.3201/eid1802.111305</pub-id> <pub-id pub-id-type="pmid">22305204</pub-id></citation></ref>
<ref id="B37"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hunt</surname> <given-names>M.</given-names></name> <name><surname>De Silva</surname> <given-names>N.</given-names></name> <name><surname>Otto</surname> <given-names>T. D.</given-names></name> <name><surname>Parkhill</surname> <given-names>J.</given-names></name> <name><surname>Keane</surname> <given-names>J. A.</given-names></name> <name><surname>Harris</surname> <given-names>S. R.</given-names></name></person-group> (<year>2015</year>). <article-title>Circlator: automated circularization of genome assemblies using long sequencing reads.</article-title> <source><italic>Genome Biol.</italic></source> <volume>16</volume>:<issue>294</issue>. <pub-id pub-id-type="doi">10.1186/s13059-015-0849-0</pub-id> <pub-id pub-id-type="pmid">26714481</pub-id></citation></ref>
<ref id="B38"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Huson</surname> <given-names>D. H.</given-names></name> <name><surname>Richter</surname> <given-names>D. C.</given-names></name> <name><surname>Rausch</surname> <given-names>C.</given-names></name> <name><surname>Dezulian</surname> <given-names>T.</given-names></name> <name><surname>Franz</surname> <given-names>M.</given-names></name> <name><surname>Rupp</surname> <given-names>R.</given-names></name></person-group> (<year>2007</year>). <article-title>Dendroscope: an interactive viewer for large phylogenetic trees.</article-title> <source><italic>BMC Bioinformatics</italic></source> <volume>8</volume>:<issue>460</issue>. <pub-id pub-id-type="doi">10.1186/1471-2105-8-460</pub-id> <pub-id pub-id-type="pmid">18034891</pub-id></citation></ref>
<ref id="B39"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jones</surname> <given-names>B. D.</given-names></name> <name><surname>Faron</surname> <given-names>M.</given-names></name> <name><surname>Rasmussen</surname> <given-names>J. A.</given-names></name> <name><surname>Fletcher</surname> <given-names>J. R.</given-names></name></person-group> (<year>2014</year>). <article-title>Uncovering the components of the <italic>Francisella tularensis</italic> virulence stealth strategy.</article-title> <source><italic>Front. Cell. Infect. Microbiol.</italic></source> <volume>4</volume>:<issue>32</issue>. <pub-id pub-id-type="doi">10.3389/fcimb.2014.00032</pub-id> <pub-id pub-id-type="pmid">24639953</pub-id></citation></ref>
<ref id="B40"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jones</surname> <given-names>C. L.</given-names></name> <name><surname>Sampson</surname> <given-names>T. R.</given-names></name> <name><surname>Nakaya</surname> <given-names>H. I.</given-names></name> <name><surname>Pulendran</surname> <given-names>B.</given-names></name> <name><surname>Weiss</surname> <given-names>D. S.</given-names></name></person-group> (<year>2012</year>). <article-title>Repression of bacterial lipoprotein production by <italic>Francisella novicida</italic> facilitates evasion of innate immune recognition.</article-title> <source><italic>Cell. Microbiol.</italic></source> <volume>14</volume> <fpage>1531</fpage>&#x2013;<lpage>1543</lpage>. <pub-id pub-id-type="doi">10.1111/j.1462-5822.2012.01816.x</pub-id> <pub-id pub-id-type="pmid">22632124</pub-id></citation></ref>
<ref id="B41"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Karlsson</surname> <given-names>E.</given-names></name> <name><surname>Svensson</surname> <given-names>K.</given-names></name> <name><surname>Lindgren</surname> <given-names>P.</given-names></name> <name><surname>Bystrom</surname> <given-names>M.</given-names></name> <name><surname>Sjodin</surname> <given-names>A.</given-names></name> <name><surname>Forsman</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2013</year>). <article-title>The phylogeographic pattern of <italic>Francisella tularensis</italic> in Sweden indicates a Scandinavian origin of Eurosiberian tularaemia.</article-title> <source><italic>Environ. Microbiol.</italic></source> <volume>15</volume> <fpage>634</fpage>&#x2013;<lpage>645</lpage>. <pub-id pub-id-type="doi">10.1111/1462-2920.12052</pub-id> <pub-id pub-id-type="pmid">23253075</pub-id></citation></ref>
<ref id="B42"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kearse</surname> <given-names>M.</given-names></name> <name><surname>Moir</surname> <given-names>R.</given-names></name> <name><surname>Wilson</surname> <given-names>A.</given-names></name> <name><surname>Stones-Havas</surname> <given-names>S.</given-names></name> <name><surname>Cheung</surname> <given-names>M.</given-names></name> <name><surname>Sturrock</surname> <given-names>S.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>Geneious Basic: an integrated and extendable desktop software platform for the organization and analysis of sequence data.</article-title> <source><italic>Bioinformatics</italic></source> <volume>28</volume> <fpage>1647</fpage>&#x2013;<lpage>1649</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/bts199</pub-id> <pub-id pub-id-type="pmid">22543367</pub-id></citation></ref>
<ref id="B43"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kingry</surname> <given-names>L. C.</given-names></name> <name><surname>Petersen</surname> <given-names>J. M.</given-names></name></person-group> (<year>2014</year>). <article-title>Comparative review of <italic>Francisella tularensis</italic> and <italic>Francisella novicida</italic>.</article-title> <source><italic>Front. Cell. Infect. Microbiol.</italic></source> <volume>4</volume>:<issue>35</issue>. <pub-id pub-id-type="doi">10.3389/fcimb.2014.00035</pub-id></citation></ref>
<ref id="B44"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Koboldt</surname> <given-names>D. C.</given-names></name> <name><surname>Chen</surname> <given-names>K.</given-names></name> <name><surname>Wylie</surname> <given-names>T.</given-names></name> <name><surname>Larson</surname> <given-names>D. E.</given-names></name> <name><surname>McLellan</surname> <given-names>M. D.</given-names></name> <name><surname>Mardis</surname> <given-names>E. R.</given-names></name><etal/></person-group> (<year>2009</year>). <article-title>VarScan: variant detection in massively parallel sequencing of individual and pooled samples.</article-title> <source><italic>Bioinformatics</italic></source> <volume>25</volume> <fpage>2283</fpage>&#x2013;<lpage>2285</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btp373</pub-id> <pub-id pub-id-type="pmid">19542151</pub-id></citation></ref>
<ref id="B45"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Koren</surname> <given-names>S.</given-names></name> <name><surname>Harhay</surname> <given-names>G. P.</given-names></name> <name><surname>Smith</surname> <given-names>T. P.</given-names></name> <name><surname>Bono</surname> <given-names>J. L.</given-names></name> <name><surname>Harhay</surname> <given-names>D. M.</given-names></name> <name><surname>McVey</surname> <given-names>S. D.</given-names></name><etal/></person-group> (<year>2013</year>). <article-title>Reducing assembly complexity of microbial genomes with single-molecule sequencing.</article-title> <source><italic>Genome Biol.</italic></source> <volume>14</volume>:<issue>R101</issue>. <pub-id pub-id-type="doi">10.1186/gb-2013-14-9-r101</pub-id> <pub-id pub-id-type="pmid">24034426</pub-id></citation></ref>
<ref id="B46"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kumar</surname> <given-names>R.</given-names></name> <name><surname>Rao</surname> <given-names>D. N.</given-names></name></person-group> (<year>2013</year>). <article-title>Role of DNA methyltransferases in epigenetic regulation in bacteria.</article-title> <source><italic>Subcell. Biochem.</italic></source> <volume>61</volume> <fpage>81</fpage>&#x2013;<lpage>102</lpage>. <pub-id pub-id-type="doi">10.1007/978-94-007-4525-4_4</pub-id> <pub-id pub-id-type="pmid">23150247</pub-id></citation></ref>
<ref id="B47"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Larkeryd</surname> <given-names>A.</given-names></name> <name><surname>Myrtennas</surname> <given-names>K.</given-names></name> <name><surname>Karlsson</surname> <given-names>E.</given-names></name> <name><surname>Dwibedi</surname> <given-names>C. K.</given-names></name> <name><surname>Forsman</surname> <given-names>M.</given-names></name> <name><surname>Larsson</surname> <given-names>P.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>CanSNPer: a hierarchical genotype classifier of clonal pathogens.</article-title> <source><italic>Bioinformatics</italic></source> <volume>30</volume> <fpage>1762</fpage>&#x2013;<lpage>1764</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btu113</pub-id> <pub-id pub-id-type="pmid">24574113</pub-id></citation></ref>
<ref id="B48"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Larsson</surname> <given-names>P.</given-names></name> <name><surname>Elfsmark</surname> <given-names>D.</given-names></name> <name><surname>Svensson</surname> <given-names>K.</given-names></name> <name><surname>Wikstrom</surname> <given-names>P.</given-names></name> <name><surname>Forsman</surname> <given-names>M.</given-names></name> <name><surname>Brettin</surname> <given-names>T.</given-names></name><etal/></person-group> (<year>2009</year>). <article-title>Molecular evolutionary consequences of niche restriction in <italic>Francisella tularensis</italic>, a facultative intracellular pathogen.</article-title> <source><italic>PLoS Pathog.</italic></source> <volume>5</volume>:<issue>e1000472</issue>. <pub-id pub-id-type="doi">10.1371/journal.ppat.1000472</pub-id> <pub-id pub-id-type="pmid">19521508</pub-id></citation></ref>
<ref id="B49"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Larsson</surname> <given-names>P.</given-names></name> <name><surname>Oyston</surname> <given-names>P. C.</given-names></name> <name><surname>Chain</surname> <given-names>P.</given-names></name> <name><surname>Chu</surname> <given-names>M. C.</given-names></name> <name><surname>Duffield</surname> <given-names>M.</given-names></name> <name><surname>Fuxelius</surname> <given-names>H. H.</given-names></name><etal/></person-group> (<year>2005</year>). <article-title>The complete genome sequence of <italic>Francisella tularensis</italic>, the causative agent of tularemia.</article-title> <source><italic>Nat. Genet.</italic></source> <volume>37</volume> <fpage>153</fpage>&#x2013;<lpage>159</lpage>. <pub-id pub-id-type="doi">10.1038/ng1499</pub-id> <pub-id pub-id-type="pmid">15640799</pub-id></citation></ref>
<ref id="B50"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>H.</given-names></name> <name><surname>Durbin</surname> <given-names>R.</given-names></name></person-group> (<year>2010</year>). <article-title>Fast and accurate long-read alignment with Burrows&#x2013;Wheeler transform.</article-title> <source><italic>Bioinformatics</italic></source> <volume>26</volume> <fpage>589</fpage>&#x2013;<lpage>595</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btp698</pub-id> <pub-id pub-id-type="pmid">20080505</pub-id></citation></ref>
<ref id="B51"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mackiewicz</surname> <given-names>P.</given-names></name> <name><surname>Zakrzewska-Czerwinska</surname> <given-names>J.</given-names></name> <name><surname>Zawilak</surname> <given-names>A.</given-names></name> <name><surname>Dudek</surname> <given-names>M. R.</given-names></name> <name><surname>Cebrat</surname> <given-names>S.</given-names></name></person-group> (<year>2004</year>). <article-title>Where does bacterial replication start? Rules for predicting the oriC region.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>32</volume> <fpage>3781</fpage>&#x2013;<lpage>3791</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkh699</pub-id> <pub-id pub-id-type="pmid">15258248</pub-id></citation></ref>
<ref id="B52"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Maurin</surname> <given-names>M.</given-names></name></person-group> (<year>2015</year>). <article-title><italic>Francisella tularensis</italic> as a potential agent of bioterrorism?</article-title> <source><italic>Expert Rev. Anti Infect. Ther.</italic></source> <volume>13</volume> <fpage>141</fpage>&#x2013;<lpage>144</lpage>. <pub-id pub-id-type="doi">10.1586/14787210.2015.986463</pub-id> <pub-id pub-id-type="pmid">25413334</pub-id></citation></ref>
<ref id="B53"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>McCarthy</surname> <given-names>A.</given-names></name></person-group> (<year>2010</year>). <article-title>Third generation DNA sequencing: Pacific Biosciences&#x2019; single molecule real time technology.</article-title> <source><italic>Chem. Biol.</italic></source> <volume>17</volume> <fpage>675</fpage>&#x2013;<lpage>676</lpage>. <pub-id pub-id-type="doi">10.1016/j.chembiol.2010.07.004</pub-id> <pub-id pub-id-type="pmid">20659677</pub-id></citation></ref>
<ref id="B54"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Meyer</surname> <given-names>F.</given-names></name> <name><surname>Paarmann</surname> <given-names>D.</given-names></name> <name><surname>D&#x2019;Souza</surname> <given-names>M.</given-names></name> <name><surname>Olson</surname> <given-names>R.</given-names></name> <name><surname>Glass</surname> <given-names>E. M.</given-names></name> <name><surname>Kubal</surname> <given-names>M.</given-names></name></person-group> (<year>2008</year>). <article-title>The metagenomics RAST server &#x2013; a public resource for the automatic phylogenetic and functional analysis of metagenomes.</article-title> <source><italic>BMC Bioinformatics</italic></source> <volume>9</volume>:<issue>386</issue>. <pub-id pub-id-type="doi">10.1186/1471-2105-9-386</pub-id> <pub-id pub-id-type="pmid">18803844</pub-id></citation></ref>
<ref id="B55"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Modise</surname> <given-names>T.</given-names></name> <name><surname>Ryder</surname> <given-names>C.</given-names></name> <name><surname>Mane</surname> <given-names>S. P.</given-names></name> <name><surname>Bandara</surname> <given-names>A. B.</given-names></name> <name><surname>Jensen</surname> <given-names>R. V.</given-names></name> <name><surname>Inzana</surname> <given-names>T. J.</given-names></name></person-group> (<year>2012</year>). <article-title>Genomic comparison between a virulent type A1 strain of <italic>Francisella tularensis</italic> and its attenuated O-antigen mutant.</article-title> <source><italic>J. Bacteriol.</italic></source> <volume>194</volume> <fpage>2775</fpage>&#x2013;<lpage>2776</lpage>. <pub-id pub-id-type="doi">10.1128/JB.00152-12</pub-id> <pub-id pub-id-type="pmid">22535949</pub-id></citation></ref>
<ref id="B56"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Moinet</surname> <given-names>M.</given-names></name> <name><surname>Decors</surname> <given-names>A.</given-names></name> <name><surname>Mendy</surname> <given-names>C.</given-names></name> <name><surname>Faure</surname> <given-names>E.</given-names></name> <name><surname>Durand</surname> <given-names>B.</given-names></name> <name><surname>Madani</surname> <given-names>N.</given-names></name></person-group> (<year>2016</year>). <article-title>Spatio-temporal dynamics of tularemia in French wildlife: 2002&#x2013;2013.</article-title> <source><italic>Prev. Vet. Med.</italic></source> <volume>130</volume> <fpage>33</fpage>&#x2013;<lpage>40</lpage>. <pub-id pub-id-type="doi">10.1016/j.prevetmed.2016.05.015</pub-id> <pub-id pub-id-type="pmid">27435644</pub-id></citation></ref>
<ref id="B57"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Morgulis</surname> <given-names>A.</given-names></name> <name><surname>Coulouris</surname> <given-names>G.</given-names></name> <name><surname>Raytselis</surname> <given-names>Y.</given-names></name> <name><surname>Madden</surname> <given-names>T. L.</given-names></name> <name><surname>Agarwala</surname> <given-names>R.</given-names></name> <name><surname>Schaffer</surname> <given-names>A. A.</given-names></name></person-group> (<year>2008</year>). <article-title>Database indexing for production MegaBLAST searches.</article-title> <source><italic>Bioinformatics</italic></source> <volume>24</volume> <fpage>1757</fpage>&#x2013;<lpage>1764</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btn322</pub-id> <pub-id pub-id-type="pmid">18567917</pub-id></citation></ref>
<ref id="B58"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mukherjee</surname> <given-names>S.</given-names></name> <name><surname>Huntemann</surname> <given-names>M.</given-names></name> <name><surname>Ivanova</surname> <given-names>N.</given-names></name> <name><surname>Kyrpides</surname> <given-names>N. C.</given-names></name> <name><surname>Pati</surname> <given-names>A.</given-names></name></person-group> (<year>2015</year>). <article-title>Large-scale contamination of microbial isolate genomes by Illumina PhiX control.</article-title> <source><italic>Stand. Genomic Sci.</italic></source> <volume>10</volume>:<issue>18</issue>. <pub-id pub-id-type="doi">10.1186/1944-3277-10-18</pub-id> <pub-id pub-id-type="pmid">26203331</pub-id></citation></ref>
<ref id="B59"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>M&#x00FC;ller</surname> <given-names>W.</given-names></name> <name><surname>Hotzel</surname> <given-names>H.</given-names></name> <name><surname>Otto</surname> <given-names>P.</given-names></name> <name><surname>Karger</surname> <given-names>A.</given-names></name> <name><surname>Bettin</surname> <given-names>B.</given-names></name> <name><surname>Bocklisch</surname> <given-names>H.</given-names></name><etal/></person-group> (<year>2013</year>). <article-title>German <italic>Francisella tularensis</italic> isolates from European brown hares (<italic>Lepus europaeus</italic>) reveal genetic and phenotypic diversity.</article-title> <source><italic>BMC Microbiol.</italic></source> <volume>13</volume>:<issue>61</issue>. <pub-id pub-id-type="doi">10.1186/1471-2180-13-61</pub-id> <pub-id pub-id-type="pmid">23517149</pub-id></citation></ref>
<ref id="B60"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Murray</surname> <given-names>I. A.</given-names></name> <name><surname>Clark</surname> <given-names>T. A.</given-names></name> <name><surname>Morgan</surname> <given-names>R. D.</given-names></name> <name><surname>Boitano</surname> <given-names>M.</given-names></name> <name><surname>Anton</surname> <given-names>B. P.</given-names></name> <name><surname>Luong</surname> <given-names>K.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>The methylomes of six bacteria.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>40</volume> <fpage>11450</fpage>&#x2013;<lpage>11462</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gks891</pub-id> <pub-id pub-id-type="pmid">23034806</pub-id></citation></ref>
<ref id="B61"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nichol</surname> <given-names>K.</given-names></name> <name><surname>Pearson</surname> <given-names>C. E.</given-names></name></person-group> (<year>2002</year>). <article-title>CpG methylation modifies the genetic stability of cloned repeat sequences.</article-title> <source><italic>Genome Res.</italic></source> <volume>12</volume> <fpage>1246</fpage>&#x2013;<lpage>1256</lpage>. <pub-id pub-id-type="doi">10.1101/gr.74502</pub-id> <pub-id pub-id-type="pmid">12176932</pub-id></citation></ref>
<ref id="B62"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Olson</surname> <given-names>N. D.</given-names></name> <name><surname>Lund</surname> <given-names>S. P.</given-names></name> <name><surname>Colman</surname> <given-names>R. E.</given-names></name> <name><surname>Foster</surname> <given-names>J. T.</given-names></name> <name><surname>Sahl</surname> <given-names>J. W.</given-names></name> <name><surname>Schupp</surname> <given-names>J. M.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>Best practices for evaluating single nucleotide variant calling methods for microbial genomics.</article-title> <source><italic>Front. Genet.</italic></source> <volume>6</volume>:<issue>235</issue>. <pub-id pub-id-type="doi">10.3389/fgene.2015.00235</pub-id> <pub-id pub-id-type="pmid">26217378</pub-id></citation></ref>
<ref id="B63"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Otto</surname> <given-names>P.</given-names></name> <name><surname>Kohlmann</surname> <given-names>R.</given-names></name> <name><surname>M&#x00FC;ller</surname> <given-names>W.</given-names></name> <name><surname>Julich</surname> <given-names>S.</given-names></name> <name><surname>Geis</surname> <given-names>G.</given-names></name> <name><surname>Gatermann</surname> <given-names>S. G.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>Hare-to-human transmission of <italic>Francisella tularensis</italic> subsp. <italic>holarctica</italic>, Germany.</article-title> <source><italic>Emerg. Infect. Dis.</italic></source> <volume>21</volume> <fpage>153</fpage>&#x2013;<lpage>155</lpage>. <pub-id pub-id-type="doi">10.3201/eid2101.131837</pub-id> <pub-id pub-id-type="pmid">25531286</pub-id></citation></ref>
<ref id="B64"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ozanic</surname> <given-names>M.</given-names></name> <name><surname>Marecic</surname> <given-names>V.</given-names></name> <name><surname>Abu Kwaik</surname> <given-names>Y.</given-names></name> <name><surname>Santic</surname> <given-names>M.</given-names></name></person-group> (<year>2015</year>). <article-title>The divergent intracellular lifestyle of <italic>Francisella tularensis</italic> in evolutionarily distinct host cells.</article-title> <source><italic>PLoS Pathog.</italic></source> <volume>11</volume>:<issue>e1005208</issue>. <pub-id pub-id-type="doi">10.1371/journal.ppat.1005208</pub-id> <pub-id pub-id-type="pmid">26633893</pub-id></citation></ref>
<ref id="B65"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pilo</surname> <given-names>P.</given-names></name> <name><surname>Johansson</surname> <given-names>A.</given-names></name> <name><surname>Frey</surname> <given-names>J.</given-names></name></person-group> (<year>2009</year>). <article-title>Identification of <italic>Francisella tularensis</italic> cluster in central and western Europe.</article-title> <source><italic>Emerg. Infect. Dis.</italic></source> <volume>15</volume> <fpage>2049</fpage>&#x2013;<lpage>2051</lpage>. <pub-id pub-id-type="doi">10.3201/eid1512.080805</pub-id> <pub-id pub-id-type="pmid">19961699</pub-id></citation></ref>
<ref id="B66"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rambaut</surname> <given-names>A.</given-names></name> <name><surname>Lam</surname> <given-names>T. T.</given-names></name> <name><surname>Max Carvalho</surname> <given-names>L.</given-names></name> <name><surname>Pybus</surname> <given-names>O. G.</given-names></name></person-group> (<year>2016</year>). <article-title>Exploring the temporal structure of heterochronous sequences using TempEst (formerly Path-O-Gen).</article-title> <source><italic>Virus Evol.</italic></source> <volume>2</volume>:<issue>vew007</issue>. <pub-id pub-id-type="doi">10.1093/ve/vew007</pub-id> <pub-id pub-id-type="pmid">27774300</pub-id></citation></ref>
<ref id="B67"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rice</surname> <given-names>P.</given-names></name> <name><surname>Longden</surname> <given-names>I.</given-names></name> <name><surname>Bleasby</surname> <given-names>A.</given-names></name></person-group> (<year>2000</year>). <article-title>EMBOSS: the European molecular biology open software suite.</article-title> <source><italic>Trends Genet.</italic></source> <volume>16</volume> <fpage>276</fpage>&#x2013;<lpage>277</lpage>. <pub-id pub-id-type="doi">10.1016/S0168-9525(00)02024-2</pub-id></citation></ref>
<ref id="B68"><citation citation-type="book"><collab>Robert-Koch-Institut</collab> (<year>2015</year>). <source><italic>Infektionsepidemiologisches Jahrbuch Meldepflichtiger Krankheiten f&#x00FC;r 2015.</italic></source> <publisher-loc>Berlin</publisher-loc>: <publisher-name>Robert-Koch-Institut</publisher-name>.</citation></ref>
<ref id="B69"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Roberts</surname> <given-names>R. J.</given-names></name> <name><surname>Vincze</surname> <given-names>T.</given-names></name> <name><surname>Posfai</surname> <given-names>J.</given-names></name> <name><surname>Macelis</surname> <given-names>D.</given-names></name></person-group> (<year>2015</year>). <article-title>REBASE&#x2014;a database for DNA restriction and modification: enzymes, genes and genomes.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>43</volume> <fpage>D298</fpage>&#x2013;<lpage>D299</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gku1046</pub-id> <pub-id pub-id-type="pmid">25378308</pub-id></citation></ref>
<ref id="B70"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rodriguez-R</surname> <given-names>L. M.</given-names></name> <name><surname>Konstantinidis</surname> <given-names>K. T.</given-names></name></person-group> (<year>2016</year>). <article-title>The enveomics collection: a toolbox for specialized analyses of microbial genomes and metagenomes.</article-title> <source><italic>PeerJ Preprints</italic></source> <volume>4</volume>:<issue>e1900v1</issue>. <pub-id pub-id-type="doi">10.7287/peerj.preprints.1900v1</pub-id></citation></ref>
<ref id="B71"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rohmer</surname> <given-names>L.</given-names></name> <name><surname>Fong</surname> <given-names>C.</given-names></name> <name><surname>Abmayr</surname> <given-names>S.</given-names></name> <name><surname>Wasnick</surname> <given-names>M.</given-names></name> <name><surname>Larson Freeman</surname> <given-names>T. J.</given-names></name> <name><surname>Radey</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2007</year>). <article-title>Comparison of <italic>Francisella tularensis</italic> genomes reveals evolutionary events associated with the emergence of human pathogenic strains.</article-title> <source><italic>Genome Biol.</italic></source> <volume>8</volume>:<issue>R102</issue>. <pub-id pub-id-type="doi">10.1186/gb-2007-8-6-r102</pub-id> <pub-id pub-id-type="pmid">17550600</pub-id></citation></ref>
<ref id="B72"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rotz</surname> <given-names>L. D.</given-names></name> <name><surname>Khan</surname> <given-names>A. S.</given-names></name> <name><surname>Lillibridge</surname> <given-names>S. R.</given-names></name> <name><surname>Ostroff</surname> <given-names>S. M.</given-names></name> <name><surname>Hughes</surname> <given-names>J. M.</given-names></name></person-group> (<year>2002</year>). <article-title>Public health assessment of potential biological terrorism agents.</article-title> <source><italic>Emerg. Infect. Dis.</italic></source> <volume>8</volume> <fpage>225</fpage>&#x2013;<lpage>230</lpage>. <pub-id pub-id-type="doi">10.3201/eid0802.010164</pub-id> <pub-id pub-id-type="pmid">11897082</pub-id></citation></ref>
<ref id="B73"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rychener</surname> <given-names>L.</given-names></name> <name><surname>Inalbon</surname> <given-names>S.</given-names></name> <name><surname>Djordjevic</surname> <given-names>S. P.</given-names></name> <name><surname>Chowdhury</surname> <given-names>P. R.</given-names></name> <name><surname>Ziech</surname> <given-names>R. E.</given-names></name> <name><surname>De Vargas</surname> <given-names>A. C.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title><italic>Clostridium chauvoei</italic>, an evolutionary dead-end pathogen.</article-title> <source><italic>Front. Microbiol.</italic></source> <volume>8</volume>:<issue>1054</issue>. <pub-id pub-id-type="doi">10.3389/fmicb.2017.01054</pub-id> <pub-id pub-id-type="pmid">28649238</pub-id></citation></ref>
<ref id="B74"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rydzewski</surname> <given-names>K.</given-names></name> <name><surname>Schulz</surname> <given-names>T.</given-names></name> <name><surname>Brzuszkiewicz</surname> <given-names>E.</given-names></name> <name><surname>Holland</surname> <given-names>G.</given-names></name> <name><surname>Luck</surname> <given-names>C.</given-names></name> <name><surname>Fleischer</surname> <given-names>J.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>Genome sequence and phenotypic analysis of a first German <italic>Francisella</italic> sp. isolate (W12-1067) not belonging to the species <italic>Francisella tularensis</italic>.</article-title> <source><italic>BMC Microbiol.</italic></source> <volume>14</volume>:<issue>169</issue>. <pub-id pub-id-type="doi">10.1186/1471-2180-14-169</pub-id> <pub-id pub-id-type="pmid">24961323</pub-id></citation></ref>
<ref id="B75"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sampson</surname> <given-names>T. R.</given-names></name> <name><surname>Saroj</surname> <given-names>S. D.</given-names></name> <name><surname>Llewellyn</surname> <given-names>A. C.</given-names></name> <name><surname>Tzeng</surname> <given-names>Y. L.</given-names></name> <name><surname>Weiss</surname> <given-names>D. S.</given-names></name></person-group> (<year>2013</year>). <article-title>A CRISPR/Cas system mediates bacterial innate immune evasion and virulence.</article-title> <source><italic>Nature</italic></source> <volume>497</volume> <fpage>254</fpage>&#x2013;<lpage>257</lpage>. <pub-id pub-id-type="doi">10.1038/nature12048</pub-id> <pub-id pub-id-type="pmid">23584588</pub-id></citation></ref>
<ref id="B76"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Schirmer</surname> <given-names>M.</given-names></name> <name><surname>Ijaz</surname> <given-names>U. Z.</given-names></name> <name><surname>D&#x2019;Amore</surname> <given-names>R.</given-names></name> <name><surname>Hall</surname> <given-names>N.</given-names></name> <name><surname>Sloan</surname> <given-names>W. T.</given-names></name> <name><surname>Quince</surname> <given-names>C.</given-names></name></person-group> (<year>2015</year>). <article-title>Insight into biases and sequencing errors for amplicon sequencing with the Illumina MiSeq platform.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>43</volume>:<issue>e37</issue>. <pub-id pub-id-type="doi">10.1093/nar/gku1341</pub-id> <pub-id pub-id-type="pmid">25586220</pub-id></citation></ref>
<ref id="B77"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Schunder</surname> <given-names>E.</given-names></name> <name><surname>Rydzewski</surname> <given-names>K.</given-names></name> <name><surname>Grunow</surname> <given-names>R.</given-names></name> <name><surname>Heuner</surname> <given-names>K.</given-names></name></person-group> (<year>2013</year>). <article-title>First indication for a functional CRISPR/Cas system in <italic>Francisella tularensis</italic>.</article-title> <source><italic>Int. J. Med. Microbiol.</italic></source> <volume>303</volume> <fpage>51</fpage>&#x2013;<lpage>60</lpage>. <pub-id pub-id-type="doi">10.1016/j.ijmm.2012.11.004</pub-id> <pub-id pub-id-type="pmid">23333731</pub-id></citation></ref>
<ref id="B78"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Seemann</surname> <given-names>T.</given-names></name></person-group> (<year>2014</year>). <article-title>Prokka: rapid prokaryotic genome annotation.</article-title> <source><italic>Bioinformatics</italic></source> <volume>30</volume> <fpage>2068</fpage>&#x2013;<lpage>2069</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btu153</pub-id> <pub-id pub-id-type="pmid">24642063</pub-id></citation></ref>
<ref id="B79"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Segata</surname> <given-names>N.</given-names></name> <name><surname>Bornigen</surname> <given-names>D.</given-names></name> <name><surname>Morgan</surname> <given-names>X. C.</given-names></name> <name><surname>Huttenhower</surname> <given-names>C.</given-names></name></person-group> (<year>2013</year>). <article-title>PhyloPhlAn is a new method for improved phylogenetic and taxonomic placement of microbes.</article-title> <source><italic>Nat. Commun.</italic></source> <volume>4</volume>:<issue>2304</issue>. <pub-id pub-id-type="doi">10.1038/ncomms3304</pub-id> <pub-id pub-id-type="pmid">23942190</pub-id></citation></ref>
<ref id="B80"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Seibold</surname> <given-names>E.</given-names></name> <name><surname>Bogumil</surname> <given-names>R.</given-names></name> <name><surname>Vorderwulbecke</surname> <given-names>S.</given-names></name> <name><surname>Al Dahouk</surname> <given-names>S.</given-names></name> <name><surname>Buckendahl</surname> <given-names>A.</given-names></name> <name><surname>Tomaso</surname> <given-names>H.</given-names></name><etal/></person-group> (<year>2007</year>). <article-title>Optimized application of surface-enhanced laser desorption/ionization time-of-flight MS to differentiate <italic>Francisella tularensis</italic> at the level of subspecies and individual strains.</article-title> <source><italic>FEMS Immunol. Med. Microbiol.</italic></source> <volume>49</volume> <fpage>364</fpage>&#x2013;<lpage>373</lpage>. <pub-id pub-id-type="doi">10.1111/j.1574-695X.2007.00216.x</pub-id> <pub-id pub-id-type="pmid">17378900</pub-id></citation></ref>
<ref id="B81"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Simpson</surname> <given-names>J. T.</given-names></name> <name><surname>Wong</surname> <given-names>K.</given-names></name> <name><surname>Jackman</surname> <given-names>S. D.</given-names></name> <name><surname>Schein</surname> <given-names>J. E.</given-names></name> <name><surname>Jones</surname> <given-names>S. J.</given-names></name> <name><surname>Birol</surname> <given-names>I.</given-names></name></person-group> (<year>2009</year>). <article-title>ABySS: a parallel assembler for short read sequence data.</article-title> <source><italic>Genome Res.</italic></source> <volume>19</volume> <fpage>1117</fpage>&#x2013;<lpage>1123</lpage>. <pub-id pub-id-type="doi">10.1101/gr.089532.108</pub-id> <pub-id pub-id-type="pmid">19251739</pub-id></citation></ref>
<ref id="B82"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sjodin</surname> <given-names>A.</given-names></name> <name><surname>Svensson</surname> <given-names>K.</given-names></name> <name><surname>Ohrman</surname> <given-names>C.</given-names></name> <name><surname>Ahlinder</surname> <given-names>J.</given-names></name> <name><surname>Lindgren</surname> <given-names>P.</given-names></name> <name><surname>Duodu</surname> <given-names>S.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>Genome characterisation of the genus <italic>Francisella</italic> reveals insight into similar evolutionary paths in pathogens of mammals and fish.</article-title> <source><italic>BMC Genomics</italic></source> <volume>13</volume>:<issue>268</issue>. <pub-id pub-id-type="doi">10.1186/1471-2164-13-268</pub-id> <pub-id pub-id-type="pmid">22727144</pub-id></citation></ref>
<ref id="B83"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Stamatakis</surname> <given-names>A.</given-names></name></person-group> (<year>2014</year>). <article-title>RAxML version 8: a tool for phylogenetic analysis and post-analysis of large phylogenies.</article-title> <source><italic>Bioinformatics</italic></source> <volume>30</volume> <fpage>1312</fpage>&#x2013;<lpage>1313</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btu033</pub-id> <pub-id pub-id-type="pmid">24451623</pub-id></citation></ref>
<ref id="B84"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Stanke</surname> <given-names>M.</given-names></name> <name><surname>Tzvetkova</surname> <given-names>A.</given-names></name> <name><surname>Morgenstern</surname> <given-names>B.</given-names></name></person-group> (<year>2006</year>). <article-title>AUGUSTUS at EGASP: using EST, protein and genomic alignments for improved gene prediction in the human genome.</article-title> <source><italic>Genome Biol.</italic></source> <volume>7</volume>(<supplement>Suppl. 1</supplement>):<issue>S11</issue>. <pub-id pub-id-type="doi">10.1186/gb-2006-7-s1-s11</pub-id> <pub-id pub-id-type="pmid">16925833</pub-id></citation></ref>
<ref id="B85"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Svensson</surname> <given-names>K.</given-names></name> <name><surname>Back</surname> <given-names>E.</given-names></name> <name><surname>Eliasson</surname> <given-names>H.</given-names></name> <name><surname>Berglund</surname> <given-names>L.</given-names></name> <name><surname>Granberg</surname> <given-names>M.</given-names></name> <name><surname>Karlsson</surname> <given-names>L.</given-names></name><etal/></person-group> (<year>2009</year>). <article-title>Landscape epidemiology of tularemia outbreaks in Sweden.</article-title> <source><italic>Emerg. Infect. Dis.</italic></source> <volume>15</volume> <fpage>1937</fpage>&#x2013;<lpage>1947</lpage>. <pub-id pub-id-type="doi">10.3201/eid1512.090487</pub-id> <pub-id pub-id-type="pmid">19961673</pub-id></citation></ref>
<ref id="B86"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Svensson</surname> <given-names>K.</given-names></name> <name><surname>Sjodin</surname> <given-names>A.</given-names></name> <name><surname>Bystrom</surname> <given-names>M.</given-names></name> <name><surname>Granberg</surname> <given-names>M.</given-names></name> <name><surname>Brittnacher</surname> <given-names>M. J.</given-names></name> <name><surname>Rohmer</surname> <given-names>L.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>Genome sequence of <italic>Francisella tularensis</italic> subspecies <italic>holarctica</italic> strain FSC200 isolated from a child with tularemia.</article-title> <source><italic>J. Bacteriol.</italic></source> <volume>194</volume> <fpage>6965</fpage>&#x2013;<lpage>6966</lpage>. <pub-id pub-id-type="doi">10.1128/JB.01040-12</pub-id> <pub-id pub-id-type="pmid">23209222</pub-id></citation></ref>
<ref id="B87"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tange</surname> <given-names>O.</given-names></name></person-group> (<year>2011</year>). <article-title>GNU parallel - the command-line power tool.</article-title> <source><italic>USENIX Mag.</italic></source> <volume>36</volume> <fpage>42</fpage>&#x2013;<lpage>47</lpage>.</citation></ref>
<ref id="B88"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>T&#x00E4;rnvik</surname> <given-names>A.</given-names></name> <name><surname>Berglund</surname> <given-names>L.</given-names></name></person-group> (<year>2003</year>). <article-title>Tularaemia.</article-title> <source><italic>Eur. Respir. J.</italic></source> <volume>21</volume> <fpage>361</fpage>&#x2013;<lpage>373</lpage>. <pub-id pub-id-type="doi">10.1183/09031936.03.00088903</pub-id></citation></ref>
<ref id="B89"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tomaso</surname> <given-names>H.</given-names></name> <name><surname>Hotzel</surname> <given-names>H.</given-names></name> <name><surname>Otto</surname> <given-names>P.</given-names></name> <name><surname>Myrtennas</surname> <given-names>K.</given-names></name> <name><surname>Forsman</surname> <given-names>M.</given-names></name></person-group> (<year>2017</year>). <article-title>Antibiotic susceptibility in vitro of <italic>Francisella tularensis</italic> subsp. <italic>holarctica</italic> isolates from Germany.</article-title> <source><italic>J. Antimicrob. Chemother.</italic></source> <volume>72</volume> <fpage>2539</fpage>&#x2013;<lpage>2543</lpage>. <pub-id pub-id-type="doi">10.1093/jac/dkx182</pub-id> <pub-id pub-id-type="pmid">28605439</pub-id></citation></ref>
<ref id="B90"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tomaso</surname> <given-names>H.</given-names></name> <name><surname>Scholz</surname> <given-names>H. C.</given-names></name> <name><surname>Neubauer</surname> <given-names>H.</given-names></name> <name><surname>Al Dahouk</surname> <given-names>S.</given-names></name> <name><surname>Seibold</surname> <given-names>E.</given-names></name> <name><surname>Landt</surname> <given-names>O.</given-names></name><etal/></person-group> (<year>2007</year>). <article-title>Real-time PCR using hybridization probes for the rapid and specific identification of <italic>Francisella tularensis</italic> subspecies <italic>tularensis</italic>.</article-title> <source><italic>Mol. Cell. Probes</italic></source> <volume>21</volume> <fpage>12</fpage>&#x2013;<lpage>16</lpage>. <pub-id pub-id-type="doi">10.1016/j.mcp.2006.06.001</pub-id> <pub-id pub-id-type="pmid">16893624</pub-id></citation></ref>
<ref id="B91"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Treangen</surname> <given-names>T. J.</given-names></name> <name><surname>Ondov</surname> <given-names>B. D.</given-names></name> <name><surname>Koren</surname> <given-names>S.</given-names></name> <name><surname>Phillippy</surname> <given-names>A. M.</given-names></name></person-group> (<year>2014</year>). <article-title>The Harvest suite for rapid core-genome alignment and visualization of thousands of intraspecific microbial genomes.</article-title> <source><italic>Genome Biol.</italic></source> <volume>15</volume>:<issue>524</issue>. <pub-id pub-id-type="doi">10.1186/s13059-014-0524-x</pub-id> <pub-id pub-id-type="pmid">25410596</pub-id></citation></ref>
<ref id="B92"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ulland</surname> <given-names>T. K.</given-names></name> <name><surname>Janowski</surname> <given-names>A. M.</given-names></name> <name><surname>Buchan</surname> <given-names>B. W.</given-names></name> <name><surname>Faron</surname> <given-names>M.</given-names></name> <name><surname>Cassel</surname> <given-names>S. L.</given-names></name> <name><surname>Jones</surname> <given-names>B. D.</given-names></name><etal/></person-group> (<year>2013</year>). <article-title><italic>Francisella tularensis</italic> live vaccine strain folate metabolism and pseudouridine synthase gene mutants modulate macrophage caspase-1 activation.</article-title> <source><italic>Infect. Immun.</italic></source> <volume>81</volume> <fpage>201</fpage>&#x2013;<lpage>208</lpage>. <pub-id pub-id-type="doi">10.1128/IAI.00991-12</pub-id> <pub-id pub-id-type="pmid">23115038</pub-id></citation></ref>
<ref id="B93"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Van der Auwera</surname> <given-names>G. A.</given-names></name> <name><surname>Carneiro</surname> <given-names>M. O.</given-names></name> <name><surname>Hartl</surname> <given-names>C.</given-names></name> <name><surname>Poplin</surname> <given-names>R.</given-names></name> <name><surname>Del Angel</surname> <given-names>G.</given-names></name> <name><surname>Levy-Moonshine</surname> <given-names>A.</given-names></name><etal/></person-group> (<year>2013</year>). <article-title>From FastQ data to high confidence variant calls: the genome analysis toolkit best practices pipeline.</article-title> <source><italic>Curr. Protoc. Bioinformatics</italic></source> <volume>43</volume> <fpage>11.10.1</fpage>&#x2013;<lpage>11.10.33</lpage>. <pub-id pub-id-type="doi">10.1002/0471250953.bi1110s43</pub-id> <pub-id pub-id-type="pmid">25431634</pub-id></citation></ref>
<ref id="B94"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Vogler</surname> <given-names>A. J.</given-names></name> <name><surname>Birdsell</surname> <given-names>D.</given-names></name> <name><surname>Price</surname> <given-names>L. B.</given-names></name> <name><surname>Bowers</surname> <given-names>J. R.</given-names></name> <name><surname>Beckstrom-Sternberg</surname> <given-names>S. M.</given-names></name> <name><surname>Auerbach</surname> <given-names>R. K.</given-names></name><etal/></person-group> (<year>2009</year>). <article-title>Phylogeography of <italic>Francisella tularensis</italic>: global expansion of a highly fit clone.</article-title> <source><italic>J. Bacteriol.</italic></source> <volume>191</volume> <fpage>2474</fpage>&#x2013;<lpage>2484</lpage>. <pub-id pub-id-type="doi">10.1128/JB.01786-08</pub-id> <pub-id pub-id-type="pmid">19251856</pub-id></citation></ref>
<ref id="B95"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Vogler</surname> <given-names>A. J.</given-names></name> <name><surname>Birdsell</surname> <given-names>D. N.</given-names></name> <name><surname>Lee</surname> <given-names>J.</given-names></name> <name><surname>Vaissaire</surname> <given-names>J.</given-names></name> <name><surname>Doujet</surname> <given-names>C. L.</given-names></name> <name><surname>Lapalus</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2011</year>). <article-title>Phylogeography of <italic>Francisella tularensis</italic> ssp. <italic>holarctica</italic> in France.</article-title> <source><italic>Lett. Appl. Microbiol.</italic></source> <volume>52</volume> <fpage>177</fpage>&#x2013;<lpage>180</lpage>. <pub-id pub-id-type="doi">10.1111/j.1472-765X.2010.02977.x</pub-id> <pub-id pub-id-type="pmid">21214606</pub-id></citation></ref>
<ref id="B96"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wick</surname> <given-names>R. R.</given-names></name> <name><surname>Schultz</surname> <given-names>M. B.</given-names></name> <name><surname>Zobel</surname> <given-names>J.</given-names></name> <name><surname>Holt</surname> <given-names>K. E.</given-names></name></person-group> (<year>2015</year>). <article-title>Bandage: interactive visualization of de novo genome assemblies.</article-title> <source><italic>Bioinformatics</italic></source> <volume>31</volume> <fpage>3350</fpage>&#x2013;<lpage>3352</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btv383</pub-id> <pub-id pub-id-type="pmid">26099265</pub-id></citation></ref>
<ref id="B97"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wion</surname> <given-names>D.</given-names></name> <name><surname>Casadesus</surname> <given-names>J.</given-names></name></person-group> (<year>2006</year>). <article-title>N6-methyl-adenine: an epigenetic signal for DNA-protein interactions.</article-title> <source><italic>Nat. Rev. Microbiol.</italic></source> <volume>4</volume> <fpage>183</fpage>&#x2013;<lpage>192</lpage>. <pub-id pub-id-type="doi">10.1038/nrmicro1350</pub-id> <pub-id pub-id-type="pmid">16489347</pub-id></citation></ref>
<ref id="B98"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wood</surname> <given-names>D. E.</given-names></name> <name><surname>Salzberg</surname> <given-names>S. L.</given-names></name></person-group> (<year>2014</year>). <article-title>Kraken: ultrafast metagenomic sequence classification using exact alignments.</article-title> <source><italic>Genome Biol.</italic></source> <volume>15</volume>:<issue>R46</issue>. <pub-id pub-id-type="doi">10.1186/gb-2014-15-3-r46</pub-id> <pub-id pub-id-type="pmid">24580807</pub-id></citation></ref>
<ref id="B99"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhou</surname> <given-names>Y.</given-names></name> <name><surname>Liang</surname> <given-names>Y.</given-names></name> <name><surname>Lynch</surname> <given-names>K. H.</given-names></name> <name><surname>Dennis</surname> <given-names>J. J.</given-names></name> <name><surname>Wishart</surname> <given-names>D. S.</given-names></name></person-group> (<year>2011</year>). <article-title>PHAST: a fast phage search tool.</article-title> <source><italic>Nucleic Acids Res.</italic></source> <volume>39</volume> <fpage>W347</fpage>&#x2013;<lpage>W352</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkr485</pub-id> <pub-id pub-id-type="pmid">21672955</pub-id></citation></ref>
<ref id="B100"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zimin</surname> <given-names>A. V.</given-names></name> <name><surname>Marcais</surname> <given-names>G.</given-names></name> <name><surname>Puiu</surname> <given-names>D.</given-names></name> <name><surname>Roberts</surname> <given-names>M.</given-names></name> <name><surname>Salzberg</surname> <given-names>S. L.</given-names></name> <name><surname>Yorke</surname> <given-names>J. A.</given-names></name></person-group> (<year>2013</year>). <article-title>The MaSuRCA genome assembler.</article-title> <source><italic>Bioinformatics</italic></source> <volume>29</volume> <fpage>2669</fpage>&#x2013;<lpage>2677</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btt476</pub-id> <pub-id pub-id-type="pmid">23990416</pub-id></citation></ref>
</ref-list>
<fn-group>
<fn id="fn01"><label>1</label><p><ext-link ext-link-type="uri" xlink:href="https://github.com/adrlar/CanSNPer">https://github.com/adrlar/CanSNPer</ext-link></p></fn>
<fn id="fn02"><label>2</label><p><ext-link ext-link-type="uri" xlink:href="https://www.qiagenbioinformatics.com/">https://www.qiagenbioinformatics.com/</ext-link></p></fn>
<fn id="fn03"><label>3</label><p><ext-link ext-link-type="uri" xlink:href="http://nebc.nerc.ac.uk">http://nebc.nerc.ac.uk</ext-link></p></fn>
</fn-group>
</back>
</article>