<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Microbiol.</journal-id>
<journal-title>Frontiers in Microbiology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Microbiol.</abbrev-journal-title>
<issn pub-type="epub">1664-302X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fmicb.2016.00813</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Microbiology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Identification of Quantitative Proteomic Differences between <italic>Mycobacterium tuberculosis</italic> Lineages with Altered Virulence</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Peters</surname> <given-names>Julian S.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn003"><sup>&#x02020;</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Calder</surname> <given-names>Bridget</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="author-notes" rid="fn003"><sup>&#x02020;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/237477/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Gonnelli</surname> <given-names>Giulia</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Degroeve</surname> <given-names>Sven</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Rajaonarifara</surname> <given-names>Elinambinina</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/333131/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Mulder</surname> <given-names>Nicola</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/29889/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Soares</surname> <given-names>Nelson C.</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/166299/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Martens</surname> <given-names>Lennart</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Blackburn</surname> <given-names>Jonathan M.</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="author-notes" rid="fn001"><sup>&#x0002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/214749/overview"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Centre of Excellence for Biomedical TB Research, Witwatersrand University</institution> <country>Johannesburg, South Africa</country></aff>
<aff id="aff2"><sup>2</sup><institution>Department of Integrative Biomedical Sciences, Institute of Infectious Diseases and Molecular Medicine, University of Cape Town</institution> <country>Cape Town, South Africa</country></aff>
<aff id="aff3"><sup>3</sup><institution>VIB, Ghent University</institution> <country>Ghent, Belgium</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Marc Bramkamp, Ludwig-Maximilians-University Munich, Germany</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Andreas Burkovski, Friedrich-Alexander-Universit&#x000E4;t Erlangen-N&#x000FC;rnberg, Germany; Julia Elisabeth Bandow, Ruhr-Universit&#x000E4;t Bochum, Germany</p></fn>
<fn fn-type="corresp" id="fn001"><p>&#x0002A;Correspondence: Jonathan M. Blackburn <email>jonathan.blackburn&#x00040;uct.ac.za</email></p></fn>
<fn fn-type="other" id="fn002"><p>This article was submitted to Microbial Physiology and Metabolism, a section of the journal Frontiers in Microbiology</p></fn>
<fn fn-type="other" id="fn003"><p>&#x02020;These authors have contributed equally to this work.</p></fn>
</author-notes>
<pub-date pub-type="epub">
<day>31</day>
<month>05</month>
<year>2016</year>
</pub-date>
<pub-date pub-type="collection">
<year>2016</year>
</pub-date>
<volume>7</volume>
<elocation-id>813</elocation-id>
<history>
<date date-type="received">
<day>23</day>
<month>01</month>
<year>2016</year>
</date>
<date date-type="accepted">
<day>12</day>
<month>05</month>
<year>2016</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x000A9; 2016 Peters, Calder, Gonnelli, Degroeve, Rajaonarifara, Mulder, Soares, Martens and Blackburn.</copyright-statement>
<copyright-year>2016</copyright-year>
<copyright-holder>Peters, Calder, Gonnelli, Degroeve, Rajaonarifara, Mulder, Soares, Martens and Blackburn</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) or licensor are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract><p>Evidence currently suggests that as a species <italic>Mycobacterium tuberculosis</italic> exhibits very little genomic sequence diversity. Despite limited genetic variability, members of the <italic>M. tuberculosis</italic> complex (MTBC) have been shown to exhibit vast discrepancies in phenotypic presentation in terms of virulence, elicited immune response and transmissibility. Here, we used qualitative and quantitative mass spectrometry tools to investigate the proteomes of seven clinically-relevant mycobacterial strains&#x02014;four <italic>M. tuberculosis</italic> strains, <italic>M. bovis, M. bovis</italic> BCG, and <italic>M. avium</italic>&#x02014;that show varying degrees of pathogenicity and virulence, in an effort to rationalize the observed phenotypic differences. Following protein preparation, liquid chromatography mass spectrometry (LC MS/MS) and data capture were carried out using an LTQ Orbitrap Velos. Data analysis was carried out using a novel bioinformatics strategy, which yielded high protein coverage and was based on high confidence peptides. Through this approach, we directly identified a total of 3788 unique <italic>M. tuberculosis</italic> proteins out of a theoretical proteome of 4023 proteins and identified an average of 3290 unique proteins for each of the MTBC organisms (representing 82% of the theoretical proteomes), as well as 4250 unique <italic>M. avium</italic> proteins (80% of the theoretical proteome). Data analysis showed that all major classes of proteins are represented in every strain, but that there are significant quantitative differences between strains. Targeted selected reaction monitoring (SRM) assays were used to quantify the observed differential expression of a subset of 23 proteins identified by comparison to gene expression data as being of particular relevance to virulence. This analysis revealed differences in relative protein abundance between strains for proteins which may promote bacterial fitness in the more virulent W. Beijing strain. These differences may contribute to this strain&#x00027;s capacity for surviving within the host and resisting treatment, which has contributed to its rapid spread. Through this approach, we have begun to describe the proteomic portrait of a successful mycobacterial pathogen. Data are available via ProteomeXchange with identifier PXD004165.</p></abstract>
<kwd-group>
<kwd><italic>Mycobacterium tuberculosis</italic></kwd>
<kwd>virulence</kwd>
<kwd>proteomics</kwd>
<kwd>SRM</kwd>
<kwd>fitness</kwd>
<kwd>stress response</kwd>
</kwd-group>
<counts>
<fig-count count="5"/>
<table-count count="3"/>
<equation-count count="0"/>
<ref-count count="35"/>
<page-count count="11"/>
<word-count count="8552"/>
</counts>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1">
<title>Introduction</title>
<p>Tuberculosis disease is caused by the bacterium <italic>Mycobacterium tuberculosis</italic>, and remains one of the leading causes of death by a single pathogen worldwide. Despite the presence of a vaccine and a number of antibiotics for the disease, it continues to cause about 2 million deaths and 8 million new cases worldwide per year. The emergence of multiple and extremely drug resistant strains, together with HIV co-infection, are fuelling the pandemic-especially in developing countries. Furthermore, latent and sub-clinical tuberculosis infection compounds tuberculosis control strategies by creating an unseen pathogenic reservoir. Even though various strains of <italic>M. tuberculosis</italic> have whole genome sequences available, the bacterium still closely guards the secrets of its success as a human pathogen.</p>
<p>According to whole-genome analysis, members of the <italic>M. tuberculosis</italic> complex (MTBC) exhibit the greatest degree of genetic conservation above all other pathogenic bacteria (99.9%). This strict level of observed genetic homogeneity initially led to the assumption that genetic variety amongst different strains would not be of any clinical significance (Homolka et al., <xref ref-type="bibr" rid="B15">2008</xref>). However, subsequent research has led to the understanding that traits manifested by members of the MTBC are influenced by the genetic and evolutionary background of the strains (Gagneux and Small, <xref ref-type="bibr" rid="B12">2007</xref>). Although, thousands of strains have been identified, only a few seem to drive widespread disease outbreaks and multi-drug resistance (Bifani et al., <xref ref-type="bibr" rid="B2">2002</xref>). <italic>M. tuberculosis</italic> isolates have been observed to exhibit vast discrepancies in phenotypic presentation especially with regard to clinical outcome and epidemiological behavior (Shimono et al., <xref ref-type="bibr" rid="B29">2003</xref>; Baker et al., <xref ref-type="bibr" rid="B1">2004</xref>; Gagneux and Small, <xref ref-type="bibr" rid="B12">2007</xref>; Nicol and Wilkinson, <xref ref-type="bibr" rid="B20">2008</xref>). The East Asian/Beijing <italic>M. tuberculosis</italic> lineage is particularly of interest due to its increasing prevalence in the global TB community, implying an apparent selective advantage compared to existing strains (Parwati et al., <xref ref-type="bibr" rid="B21">2010</xref>). It is therefore cause for concern that modern Beijing lineages appear to be accumulating mutations which enhance pathogenicity, apparently under positive selection pressure (Merker et al., <xref ref-type="bibr" rid="B19">2015</xref>). The exact mode by which increased pathogenicity is conferred in this lineage remains undetermined and is likely to be a combination of factors (Ribeiro et al., <xref ref-type="bibr" rid="B23">2014</xref>), however some proposed mechanisms include enhanced stress response, drug resistance and altered host-pathogen interactions, as has been reviewed previously (Hanekom et al., <xref ref-type="bibr" rid="B14">2011</xref>; Warner et al., <xref ref-type="bibr" rid="B35">2015</xref>). On the other hand, some closely related strains in the <italic>M. tuberculosis</italic> complex (MTBC) have attenuated virulence in humans (such as the vaccine strain BCG), or are not typically human pathogens and will only opportunistically infect immunocompromised humans (Desforges and Horsburgh, <xref ref-type="bibr" rid="B7">1991</xref>; Wang and Behr, <xref ref-type="bibr" rid="B34">2014</xref>; Halstrom et al., <xref ref-type="bibr" rid="B13">2015</xref>).</p>
<p>Whilst genetic variation across multiple strains has been studied in depth, the clinical and epidemiological consequences of genetic differences between mycobacterial strains remains poorly understood (Malik and Godfrey-Faussett, <xref ref-type="bibr" rid="B16">2005</xref>). As a consequence, it is not known whether the proteome is comparatively static between different strains of <italic>M. tuberculosis</italic> or whether quantitative differences in the expressed proteomes could contribute in some way to differential virulence. Here, we used liquid chromatography mass spectrometry (LC-MS)-based proteomics to define and compare the proteomic complement of 6 clinically relevant mycobacterial strains within the MTBC as well as a strain of <italic>Mycobacterium avium</italic> as an outlier. While these strains are all pathogenic in principal, the extent to which they cause disease in humans varies greatly. We therefore aimed to identify protein expression profiles that might correlate with altered virulence amongst these strains by comparing more pathogenic strains in the MTBC to less pathogenic <italic>Mycobacterium bovis</italic>, BCG and <italic>M. avium</italic> strains.</p>
</sec>
<sec sec-type="materials and methods" id="s2">
<title>Materials and methods</title>
<p><italic>M. tuberculosis</italic> isolates H37Rv, W-Beijing, CAS and LAM3 were obtained from the Medical Microbiology Division of the University of Cape Town. The clinical strains representing lineages 2 (Beijing), 3 (CAS), and 4 (LAM3/F11) were isolated from pediatric patients from Red Cross war memorial hospital, Cape Town. <italic>M. tuberculosis</italic> H37Rv was used in all assays as a reference strain. Phylogeny of the isolates was determined using spoligotyping and MIRU-VNTR described in Sarkar et al. (<xref ref-type="bibr" rid="B25">2012</xref>) and is shown in Supplementary Table <xref ref-type="supplementary-material" rid="SM1">1</xref>. The Danish strain of <italic>M. bovis</italic> BCG was used in this study. The <italic>M. avium</italic> strain was obtained from the National Health Laboratory Services (NHLS) laboratory and was verified using line probe assays. <italic>M. bovis</italic> was obtained from Stellenbosch University Health Sciences Department in Tygerberg Hospital, Cape Town.</p>
<sec>
<title>Cell culture</title>
<p>Cells were maintained in wholly synthetic Sautons media (2% glycerol, 0.4% L-asparagine, 0.2% glucose, 0.2% citric acid, 0.05% mono-potassium phosphate, 0.05% magnesium sulfate, 0.015% Tween 80, 0.005% ferric citrate, 0.00001% zinc sulfate at pH 7.4). Briefly, 190 ml of Sautons medium was inoculated with a 10 ml starter culture (approximately 10<sup>8</sup> bacteria/ml). The flasks were sealed and incubated at 37&#x000B0;C and 5% CO<sub>2</sub> with gentle agitation until OD<sub>600</sub> reached 0.9 (approximately 6 weeks).</p>
</sec>
<sec>
<title>Protein extraction</title>
<p>Proteins were extracted in a Biosafety level 3 facility in line with health and safety guidelines. Briefly, the cell pellet was separated from the culture filtrate by centrifugation at 4000 &#x000D7; g for 15 min in a bench-top centrifuge. Cell lysis was carried out by boiling the cell pellet in 1% SDS buffer (1% SDS, 100 mM Tris-HCl pH 7.6, 0.1 mM dithiothreitol (DTT), 1 mM PMSF) for 30 min. Cell debris was separated from the protein containing supernatant by centrifugation at 10,000 &#x000D7; g for 15 min in a bench top centrifuge and the supernatant containing the protein was transferred into a clean tube. Protein extracts from cell lysates were concentrated and buffer exchanged to 2 M urea buffer using 3 kDa MWCO filters (Millipore). Culture filtrate proteins were concentrated and buffer exchanged into 2 M urea using 15 ml 10 kDa MWCO filters. Protein concentration was determined using the BCA assay kit (Thermo Scientific). A 10 kDa MWCO filter was used for the culture filtrate instead of a 3 kDa because this is the lowest filter size available for large volumes, however, according to manufacturer&#x00027;s product specifications (Millipore), proteins as low as 3 kDa are still retained on 10 kDa MWCO filters.</p>
</sec>
<sec>
<title>Protein separation (1D SDS PAGE)</title>
<p>Proteins were separated according to molecular weight using an SDS PAGE gel system. The separating gels were made from 10% acrylamide: bis-acrylamide, 0.375 M Tris-HCl (pH 8.8), 7.5% SDS, 0.5% ammonium persulphate and 0.1% TEMED. The stacking gels consisted of 4% acrylamide: bis-acrylamide, 0.125 M Tris-HCl (pH 6.8), 0.1% SDS, 0.5% ammonium persulphate and 0.1% TEMED. 40 &#x003BC;g of each sample (culture filtrate and intracellular protein) was mixed with an equal volume of 2x sample buffer and heated at 65&#x000B0;C for 5 min. Electrophoresis was performed from anode to cathode at 100 V using a BioRad mini-Protean II gel system until the bromophenol blue dye reached the bottom of the gel.</p>
</sec>
<sec>
<title>Protein visualization</title>
<p>Visualization of the proteins on the gel was performed using Coomasie brilliant blue R250 for 1 h (50% methanol, 10% acetic acid and 0.1% Coomasie brilliant blue R250). Destaining of the gels was carried out by incubating on a shaker overnight at room temperature in destaining solution (10% methanol, 10% acetic acid).</p>
</sec>
<sec>
<title>In gel trypsin digestion</title>
<p>Each gel lane for each strain sample was divided into 5 pieces (i.e., 5 culture filtrate fractions and 5 intracellular protein fractions, hence a total of 10 fractions per strain). Each gel piece was cut into smaller cubes and washed twice with water followed by 50% (v/v) acetonitrile for 10 min. The acetonitrile was replaced with 50 mM ammonium bicarbonate and incubated for 10 min. Washes with 50 mM ammonium bicarbonate were repeated twice to remove acetonitrile. All the gel pieces were then incubated in 100% acetonitrile until they turned white, after which the gel pieces were dried <italic>in vacuo</italic>. Proteins were reduced with 10 mM DTT for 1 h at 57&#x000B0;C. This was followed by brief washing steps of ammonium bicarbonate followed by 50% acetonitrile before proteins were alkylated with 55 mM iodoacetamide for 1 h in the dark. Following alkylation, the gel slices were washed with ammonium bicarbonate for 10 min followed by 50% acetonitrile for 20 min, before being dried <italic>in vacuo</italic>. The proteins in the gel cubes were digested with trypsin (Promega) at 37&#x000B0;C overnight in a 1:50 trypsin: protein ratio. The resulting peptides were extracted twice with 70% acetonitrile in 0.1% formic acid for 30 min and then dried and stored at &#x02212;20&#x000B0;C. Dried peptides were dissolved in 5% acetonitrile in 0.1% formic acid and 10 &#x003BC;l injections were made for nano-LC chromatography.</p>
</sec>
<sec>
<title>Mass spectrometry</title>
<p>All experiments were performed on a Thermo Scientific EASY-nLC II coupled to an LTQ Orbitrap Velos mass spectrometer (Thermo Scientific, Bremen, Germany) equipped with a nano-electrospray source. For liquid chromatography, separation was performed on an EASY-Column (2 cm, ID 100 &#x003BC;m, 5 &#x003BC;m, C18) pre-column followed by a, EASY-column (10 cm, ID 75 &#x003BC;m, 3 &#x003BC;m, C18) column with a flow rate of 300 nl/min. The gradient used was from 5&#x02013;15% B in 5 min, 15&#x02013;35% B in 90 min, 35&#x02013;60% B in 10 min, 60&#x02013;80% B in 5 min, and kept at 80% B for 10 min. Solvent A was 100% water in 0.1% formic acid; solvent B was 100% acetonitrile in 0.1% formic acid. MS/MS data was acquired from the Orbitrap Velos in Top 20 CID mode.</p>
</sec>
<sec>
<title>Post MS data analysis</title>
<p>Raw data was captured from the mass spectrometer and converted to MS2 files using MakeMS2 software (Thermo Scientific). The data was then analyzed using Crux (McIlwain et al., <xref ref-type="bibr" rid="B17">2014</xref>) and Mascot (Cottrell and London, <xref ref-type="bibr" rid="B4">1999</xref>), and the output of MS2PIP (Degroeve and Martens, <xref ref-type="bibr" rid="B6">2013</xref>) was used additional features for the Percolator algorithm. Spectra were obtained from each fraction of the gel (a total of 5 fractions per strain) and were viewed using Peaks v5.3. The mass spectrometry proteomics data have been deposited to the ProteomeXchange Consortium via the PRIDE (Vizca&#x000ED;no et al., <xref ref-type="bibr" rid="B33">2016</xref>) partner repository with the dataset identifier PXD004165.</p>
</sec>
<sec>
<title>Protein preparation for SRM-MS</title>
<p>Proteins were extracted in the BSL3 facility in line with health and safety guidelines as described in Section Protein extraction. Protein concentration was determined using a BCA assay according to manufacturer&#x00027;s protocol (&#x00023;23227, Thermo Fisher Scientific). Protein preparation was performed using a filter aided sample preparation (FASP) method. Briefly, 200 &#x003BC;g of each protein sample was placed into a 10 KDa molecular weight cut off filter (MWCO) (Millipore). Protein cysteine residues were alkylated in the dark for 30 min in 10 mM iodoacetamide. Iodoacteamide was then removed by centrifugation at 14,000 &#x000D7; g for 15 min. Buffer exchange was performed twice with 8 M urea in 0.1 mM Tris-HCl pH 8.5 by centrifugation at 14,000 &#x000D7; g for 15 min in a refrigerated bench-top centrifuge at 18&#x000B0;C. The urea buffer was then exchanged for 0.05 M ammonium bicarbonate by centrifugation. Sequencing-grade modified trypsin (&#x00023;608-274-4330, Promega) was added at a ratio of 1:100 enzyme: substrate and incubated overnight at 37&#x000B0;C in a wet chamber. The peptides were finally collected through the filter into a clean collection tube by centrifugation at 14 000 &#x000D7; g for 10 min.</p>
<p>To stop the tryptic digest the pH was lowered to 2 using 50% trifluoro acetic acid (TFA) followed by an incubation for 15 min at 37&#x000B0;C with shaking at 500 rpm. The peptide solution was desalted with C18 reversed-phase columns (Pierce &#x00023;89870-25) according to the manufacturer&#x00027;s instructions. Briefly, the C18 columns were activated with 50% methanol, followed by equilibration with 5% ACN: 0.5% TFA. After loading the sample, the columns were washed 3 times with 5% ACN: 0.5% TFA. Finally, peptides were eluted with 70% ACN, dried under vacuum, and re-solubilized in 0.1% FA to a final concentration of 8 &#x003BC;g/&#x003BC;l.</p>
</sec>
<sec>
<title>SRM mass spectrometry</title>
<p>All SRM experiments were performed on a TSQ Vantage triple quadrupole mass spectrometer (Thermo Fisher Scientific) equipped with a heated electrospray II ion source. For liquid chromatography and separation of peptides, a Synergi 4 &#x003BC; Hydro RP 150 &#x000D7; 4.60 mm 80 &#x000C5; pore size C18 column (serial &#x00023; 630710-14) was used with a column flow rate of 300 &#x003BC;l/min. The gradient used was from 5&#x02013;15% B in 5 min, 15&#x02013;35% B in 90 min, 35&#x02013;60% B in 10 min, 60&#x02013;80% B in 5 min and kept at 80% B for 10 min. Solvent A was 100% water in 0.1% formic acid, and solvent B was 100% acetonitrile in 0.1% formic acid.</p>
<p>The mass spectrometer was operated in positive mode using electrospray ionization with a voltage of 3500 V. The capillary temperature was set to 350&#x000B0;C and the collision gas pressure to 1.2 mTorr. Up to 336 transitions per run were acquired with a cycle time of 3 s and a dwell time of at least 20 ms. Collision energies were calculated per individual peptide transition ion using Skyline software and further optimized by a series of energy ramping experimental steps (10 steps of 5 V) to obtain the optimum energy of each transition. MS/MS data was acquired from the CID mode. Raw data was captured from the mass spectrometer and analyzed using Skyline software.</p>
<p>The proteins chosen for SRM analysis were based on relevance in pathogenicity and/or virulence as stated in literature as shown in Supplementary Table <xref ref-type="supplementary-material" rid="SM2">2</xref>. To design SRM assays, peptides were chosen for analysis based on their prior observation in our discovery experiments. Although, each protein was typically observed by two or more peptides in the discovery experiment, the two best performing peptides were chosen to confirm each protein in the SRM assay, with the exception of 2 proteins (Rv1818c and Rv0833) (Supplementary Table <xref ref-type="supplementary-material" rid="SM3">3</xref>). Due to the small size and non-redundant nature of the <italic>M. tuberculosis</italic> proteome, 3 ion transitions were set as the minimum number required to identify a peptide in an SRM assay.</p>
</sec>
<sec>
<title>SRM data analysis</title>
<p>Data analysis was carried out using Skyline software (MacCoss Lab software). Intra-assay ambiguity (CV) for each peptide was based on the calculated average protein concentration for a set of technical duplicate injections of each sample. Inter-assay CV was calculated for each peptide from across three biological replicates of the 7 strains. Quantitation of each peptide was carried out using the area under the curve for the peptide transitions assayed in Skyline. Retention times for the peptide standards were obtained by pre-assessment on the MS. For peptides without standards, the retention times were obtained from predictions made by Skyline software and gated at 5 s from the predicted retention time.</p>
</sec>
<sec>
<title>Protein inference</title>
<p>The protein databases used to generate theoretical spectra were strain specific individual non-redundant fasta files obtained from Ensembl (<ext-link ext-link-type="uri" xlink:href="http://www.ensembl.org">www.ensembl.org</ext-link>), with the exception of LAM for which there is no Ensembl annotation, and W-Beijing whose annotated file is not sufficient for downstream cross strain comparison. For LAM, the UniProt fasta file was used (<ext-link ext-link-type="uri" xlink:href="http://www.uniprot.org">www.uniprot.org</ext-link>) and for W-Beijing, the H37Rv Ensembl fasta file was used. The parameters were standard across both searches and included carbamidomethylation of cysteine residues as a fixed modification and oxidation of methionine residues as a variable modification. Two missed cleavages were allowed and peptide mass tolerance was set at 10 ppm whilst fragment mass tolerance was set to 0.5 Da. Decoy databases were used for FDR analysis and a cut-off was set at 5% for protein identifications.</p>
<p>The PSMs obtained from the search were used to predict the expressed protein repertoire of each sample. MS/MS spectra from the 10 fractions per strain were searched with each individual search engine. Combining results from multiple search engines yields higher protein identifications (Shteynberg et al., <xref ref-type="bibr" rid="B30">2013</xref>), and therefore all the proteins identified from each individual search engine were combined and redundancy was removed to give one complete non-redundant dataset per study organism.</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>Results</title>
<p>Total protein extracts from the discovery MS approach were quantified using BCA assay with concentrations ranging between 2.5&#x02013;15 &#x003BC;g/&#x003BC;l for total cellular proteins and 10&#x02013;40 &#x003BC;g/&#x003BC;l for culture filtrate proteins. Each tryptically digested sample was analyzed on the Orbitrap Velos to produce an LC-MS and MS/MS dataset. To assess the efficiency of the tryptic digest a descriptive analysis software package in Protein Pilot was used and the results are summarized in Supplementary Table <xref ref-type="supplementary-material" rid="SM4">4</xref>.</p>
<p>As shown in Supplementary Figure <xref ref-type="supplementary-material" rid="SM6">1A</xref>, the MS1 scan of H37Rv confirms a successful tryptic digest with the total ion chromatogram in showing a steady elution of peptides across the LC gradient. The 2D MS chromatogram (Supplementary Figure <xref ref-type="supplementary-material" rid="SM6">1B</xref>) demonstrates the complexity of the sample, showing a significant number of discrete tryptic peptides eluting at the marked time point indicated on the 1D chromatogram (&#x0007E;2600 s).</p>
<p>For the analysis of the MS2 spectra a software pipeline was implemented that combines the results of different peptide identification strategies. At the core of our pipeline is the semi-supervised learning algorithm implemented in Percolator (Brosch et al., <xref ref-type="bibr" rid="B3">2009</xref>) that has been shown to obtain high identification sensitivity. The first tool in the pipeline is Crux (McIlwain et al., <xref ref-type="bibr" rid="B17">2014</xref>) which is a reimplementation of the popular tool Sequest with added post-processing by the Percolator algorithm. The second tool is Mascot (Cottrell and London, <xref ref-type="bibr" rid="B4">1999</xref>) for which again Percolator was used to post-process the MOWSE identification scores<xref ref-type="fn" rid="fn0001"><sup>1</sup></xref>.</p>
<p>The Percolator tool allows for adding new features that can be exploited by the semi-supervised learning algorithm to further increase peptide identification sensitivity. It has been shown that adding features obtained from MS2 peak intensity predictions can significantly increase sensitivity (Sun et al., <xref ref-type="bibr" rid="B31">2007</xref>). Therefore, we employed the MS2PIP (Degroeve and Martens, <xref ref-type="bibr" rid="B6">2013</xref>) tool to predict the b- and y-ion peak intensities for all peptides suggested by Mascot (top ranked peptide for each MS2 spectrum). We then computed several features from the difference between the predicted and the observed MS2 peak intensities, such as the Pearson correlation. We observed that adding these features to the Percolator algorithm for Mascot did indeed increase identification sensitivity significantly.</p>
<p>Comparison of protein numbers obtained at 1% and 5% FDR showed that the use of 5% FDR allows a substantial increase in the absolute number of true positives with an insignificant increase in the absolute number of false positives, hence providing an apparently favorable trade-off in true positives over false positives (Figure <xref ref-type="fig" rid="F1">1</xref>). The final proteome obtained from each strain using all algorithms represented a high proportion of the theoretical protein fasta files for each strain, as shown in Table <xref ref-type="table" rid="T1">1</xref>.</p>
<fig id="F1" position="float">
<label>Figure 1</label>
<caption><p><bold>(A)</bold> The contribution of each of the search engines to the total number of non-redundant proteins obtained per strain at 5% FDR. Mascot is shown in blue bars, Crux is shown in red bars, Mascot&#x0002B;MS2PIP&#x0002B;Percolator is shown in green bars and the total non-redundant library is shown in purple bars. <bold>(B)</bold> The comparison between 1 and 5% FDR across all strains. This illustrates the total number of proteins obtained for each strain at each FDR, and the proportion of true and false positives in that FDR bracket.</p></caption>
<graphic xlink:href="fmicb-07-00813-g0001.tif"/>
</fig>
<table-wrap position="float" id="T1">
<label>Table 1</label>
<caption><p><bold>Total non-redundant number of proteins obtained in the experiment compared to the total number of proteins in the theoretical fasta file</bold>.</p></caption>
<table frame="hsides" rules="groups">
<thead><tr>
<th valign="top" align="left"><bold>Strain</bold></th>
<th valign="top" align="center"><bold>Total &#x00023; proteins in fasta file</bold></th>
<th valign="top" align="center"><bold>Total &#x00023; detected experimentally (5% FDR)</bold></th>
<th valign="top" align="center"><bold>% of total theoretical proteome found</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left"><italic>M. avium</italic></td>
<td valign="top" align="center">5314</td>
<td valign="top" align="center">4250</td>
<td valign="top" align="center">80</td>
</tr>
<tr>
<td valign="top" align="left"><italic>M. tuberculosis H37Rv</italic></td>
<td valign="top" align="center">4049</td>
<td valign="top" align="center">3539</td>
<td valign="top" align="center">87</td>
</tr>
<tr>
<td valign="top" align="left"><italic>M. tuberculosis Beijing</italic></td>
<td valign="top" align="center">4049</td>
<td valign="top" align="center">3224</td>
<td valign="top" align="center">80</td>
</tr>
<tr>
<td valign="top" align="left"><italic>M. tuberculosis CAS</italic></td>
<td valign="top" align="center">4049</td>
<td valign="top" align="center">2746</td>
<td valign="top" align="center">68</td>
</tr>
<tr>
<td valign="top" align="left"><italic>M. tuberculosis LAM</italic></td>
<td valign="top" align="center">3904</td>
<td valign="top" align="center">3500</td>
<td valign="top" align="center">90</td>
</tr>
<tr>
<td valign="top" align="left"><italic>M. bovis BCG</italic></td>
<td valign="top" align="center">4041</td>
<td valign="top" align="center">3272</td>
<td valign="top" align="center">81</td>
</tr>
<tr>
<td valign="top" align="left"><italic>M. bovis</italic></td>
<td valign="top" align="center">4001</td>
<td valign="top" align="center">3461</td>
<td valign="top" align="center">87</td>
</tr>
</tbody>
</table>
</table-wrap>
<sec>
<title>Data alignment for downstream comparison</title>
<p>To carry out an effective cross strain comparison, it was crucial to ensure that as much of the theoretical proteome as possible was observed by discovery MS. After obtaining a non-redundant dataset for each strain using strain specific databases, it became necessary to convert all the protein IDs into a standard protein ID by orthology mapping to allow effective cross strain comparison. To achieve this, the total non-redundant IDs from each strain obtained by searching against its individual Ensembl fasta file were then mapped back to the Ensembl H37Rv protein IDs. These were all in turn mapped to UniProt accession numbers and Tuberculist &#x0201C;Rv&#x0201D; loci numbers to facilitate downstream analysis with tools such as GO analysis and pathway mapping. It was observed that there is a slight deficiency in ortholog mapping data between databases (Ensembl and UniProt), as well as shortcomings in ortholog mapping between strains. These discrepancies lead to a minor loss of information, as represented in Figure <xref ref-type="fig" rid="F2">2</xref>. The discrepancy in ortholog mapping was much more pronounced when mapping protein IDs to H37Rv from the more distantly related <italic>M. avium</italic>, which lies outside the MTBC group; this resulted in loss of approximately 50% of the biological information in downstream comparisons to <italic>M. avium</italic>. Other strains showed relatively small losses in the number of experimentally observed proteins mapped to H37Rv orthologs, for instance the LAM strain had approximately 600 proteins with no orthologs in H37Rv which were therefore not included in the cross-species comparison.</p>
<fig id="F2" position="float">
<label>Figure 2</label>
<caption><p><bold>The losses in number of identified proteins obtained after experimental ortholog mapping to <italic><bold>M. tuberculosis</bold></italic> H37Rv for each strain</bold>. <italic>Avium</italic>&#x02014;<italic>Mycobacterium avium</italic>, H37Rv&#x02014;<italic>Mycobacterium tuberculosis</italic> H37Rv, Beijing&#x02014;<italic>Mycobacterium tuberculosis</italic> W. Beijing, CAS&#x02014;<italic>Mycobacterium tuberculosis</italic> CAS, LAM&#x02014;<italic>Mycobacterium tuberculosis</italic> LAM, BCG&#x02014;<italic>Mycobacterium bovis</italic> BCG, Bovis&#x02014;<italic>Mycobacterium bovis</italic>.</p></caption>
<graphic xlink:href="fmicb-07-00813-g0002.tif"/>
</fig>
</sec>
<sec>
<title>Qualitative cross species comparison</title>
<p>With congruent IDs, strains were cross-compared to obtain a comprehensive qualitative comparison as summarized in Figure <xref ref-type="fig" rid="F3">3</xref> using the Venn diagram tool Venny [267]. Protein IDs from the 4 <italic>Mycobacterium tuberculosis</italic> strains were compared (Figure <xref ref-type="fig" rid="F3">3A</xref>) and, as expected, the majority of observed proteins were found to be shared amongst all <italic>M. tuberculosis</italic> strains, with less than 5% being strain specific. A total of 1938 proteins comprise the shared proteins among the 4 <italic>M. tuberculosis</italic> strains, perhaps representing a <italic>M. tuberculosis</italic> core proteome. A second diagram was generated comparing the collective, non-redundant proteomes of the four <italic>M. tuberculosis</italic> strains to those of <italic>M. bovis</italic>, BCG, <italic>M. avium</italic> (Figure <xref ref-type="fig" rid="F3">3B</xref>). Surprisingly, <italic>M. avium</italic> had many proteins in common with the MTBC strains, with only 12 unique proteins apparently unique to <italic>M. avium</italic>; this may simply reflect though the deficiencies in ortholog mapping between more distantly related organisms. The four <italic>M. tuberculosis</italic> strains also share 989 common proteins with <italic>M. bovis</italic> and BCG which they do not share with <italic>M. avium</italic>. A group of 168 was observed uniquely in the <italic>M. tuberculosis</italic> strains and not found in <italic>M. bovis</italic>, BCG or <italic>M. avium</italic>; these proteins were therefore earmarked as candidate virulence factors to be further explored.</p>
<fig id="F3" position="float">
<label>Figure 3</label>
<caption><p><bold>Qualitative cross strain/species data analysis. (A)</bold> Venn diagram showing the overlap in the numbers of protein identifications between the 4 strictly <italic>Mycobacterium tuberculosis</italic> strains CAS, LAM, W-Beijing, and H37Rv. <bold>(B)</bold> Venn diagram representing the comparison between the collective non-redundant proteins obtained in the 4 strictly <italic>M. tuberculosis</italic> strains (CAS, LAM, W-Beijing, and H37Rv) denoted &#x0201C;Human clinical strains&#x0201D; and those of <italic>M. bovis</italic>, BCG, and <italic>M. avium</italic>.</p></caption>
<graphic xlink:href="fmicb-07-00813-g0003.tif"/>
</fig>
</sec>
<sec>
<title>Protein expression profiling</title>
<p>We subsequently sought to quantitatively assess a subset of the candidate virulence factors identified by discovery MS and cross-strain comparison using selected reaction monitoring (SRM)&#x02014;a sensitive, reproducible and quantitative MS technique. Since the design of SRM robust assays can be a lengthy process and the capacity to highly multiplex hundreds of SRM assays remains challenging, we devised a strategy to create a short list of candidate proteins with possible relevance in differential clinical phenotypes observed between the <italic>M. tuberculosis</italic> isolates for subsequent quantitative proteomic analysis. To do this, we compared our proteomic data on each of the 168 proteins (Supplementary Table <xref ref-type="supplementary-material" rid="SM5">5</xref>) that were observed only in the <italic>M. tuberculosis</italic> strains with 771 gene expression data sets contained in the TBDB, representing varying <italic>in vitro</italic> models of TB disease. We focussed attention in particular on 7 categories of experiment from the TBDB that aimed to more closely reflect <italic>in vivo</italic> conditions (e.g., starvation models, macrophage infection models, hypoxic models, etc.), the logic being that consistent over-expression of a protein in one of those categories might plausibly confer a selective advantage to the bacterium <italic>in vivo</italic>; the categories chosen are listed in Table <xref ref-type="table" rid="T2">2</xref>.</p>
<table-wrap position="float" id="T2">
<label>Table 2</label>
<caption><p><bold>The number of significantly differentially expressed proteins from the 168 proteins unique to human clinical strains segregated into over- or under-expressed per category assessed (<ext-link ext-link-type="uri" xlink:href="http://www.tbdb.org">www.tbdb.org</ext-link>)</bold>.</p></caption>
<table frame="hsides" rules="groups">
<thead><tr>
<th valign="top" align="left"><bold>TBDB Experiment</bold></th>
<th valign="top" align="center"><bold>Over-expressed</bold></th>
<th valign="top" align="center"><bold>Under-expressed</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Acid media</td>
<td valign="top" align="center">58</td>
<td valign="top" align="center">38</td>
</tr>
<tr>
<td valign="top" align="left">Macrophage</td>
<td valign="top" align="center">18</td>
<td valign="top" align="center">53</td>
</tr>
<tr>
<td valign="top" align="left">Hypoxia</td>
<td valign="top" align="center">59</td>
<td valign="top" align="center">49</td>
</tr>
<tr>
<td valign="top" align="left">NO treatment</td>
<td valign="top" align="center">78</td>
<td valign="top" align="center">32</td>
</tr>
<tr>
<td valign="top" align="left">Starvation</td>
<td valign="top" align="center">51</td>
<td valign="top" align="center">26</td>
</tr>
<tr>
<td valign="top" align="left">Persistence</td>
<td valign="top" align="center">23</td>
<td valign="top" align="center">43</td>
</tr>
<tr>
<td valign="top" align="left">Antibiotics</td>
<td valign="top" align="center">40</td>
<td valign="top" align="center">54</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>For each of the 168 proteins, we assessed whether they were significantly over- or under-expressed in each of the 7 chosen categories of gene expression models and carried out statistical analysis on the gene expression values obtained from the TBDB experiments using packages in R (strategy depicted in Figure <xref ref-type="fig" rid="F4">4</xref>). Proteins from the 168 protein set whose gene expression showed an average fold change of &#x02265;2 SD from the mean across all datasets in an individual condition were taken as significantly differentially expressed in that condition. Proteins that had significant fold change for fewer than 4 out of the 7 categories were removed from this list, resulting in a final shortlist of 23 proteins, summarized in Table <xref ref-type="table" rid="T3">3</xref>. In order to create SRM assays for the shortlisted proteins, the <italic>M. tuberculosis</italic> proteome library (Schubert et al., <xref ref-type="bibr" rid="B28">2013</xref>) was consulted and validated SRM assays for the proteins of interest were extracted.</p>
<fig id="F4" position="float">
<label>Figure 4</label>
<caption><p><bold>Gene expression analysis approach of the short list of 168 proteins expressed in human clinical strains</bold>. Expression ratio data was obtained from the chosen TBDB experiments and statistical packages in R were used to convert the ratios into fold changes. Analysis of the fold changes was done in R to indicate proteins that have significant fold changes (&#x02265;2 from the mean) which are shown in the scatterplot above and below the shaded area.</p></caption>
<graphic xlink:href="fmicb-07-00813-g0004.tif"/>
</fig>
<table-wrap position="float" id="T3">
<label>Table 3</label>
<caption><p><bold>The 23 mycobacterial proteins identified in discovery proteomic experiments which were subsequently selected for quantitative targeted proteomic analysis</bold>.</p></caption>
<table frame="hsides" rules="groups">
<thead><tr>
<th valign="top" align="left"><bold>Rv locus</bold></th>
<th valign="top" align="left"><bold>Function and prediction from gene expression data</bold></th>
<th valign="top" align="center"><bold><italic>p</italic>-value</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Rv0301</td>
<td valign="top" align="left">VapC2; toxin; possible mRNAse; impaired growth when expressed | macrophage infection models</td>
<td valign="top" align="center">6,75E-07</td>
</tr>
<tr>
<td valign="top" align="left">Rv0899</td>
<td valign="top" align="left">ArfA; outer membrane porin A; tolerance to acidic conditions, impaired growth at pH 5.5</td>
<td valign="top" align="center">5,55E-08</td>
</tr>
<tr>
<td valign="top" align="left">Rv0901</td>
<td valign="top" align="left">ArfC; unknown function; tolerance to acidic conditions, impaired growth at pH 5.5</td>
<td valign="top" align="center">6,42E-06</td>
</tr>
<tr>
<td valign="top" align="left">Rv0966</td>
<td valign="top" align="left">Unknown function; highly activated in the early stages of tuberculosis blood brain barrier invasion (CNS TB)</td>
<td valign="top" align="center">1,96E-05</td>
</tr>
<tr>
<td valign="top" align="left">Rv1002c</td>
<td valign="top" align="left">Pmt; probable mannosyltransferase; conserved membrane protein growth and survival in host</td>
<td valign="top" align="center">9,35E-07</td>
</tr>
<tr>
<td valign="top" align="left">Rv1346</td>
<td valign="top" align="left">MbtN; mycobactin biosynthesis; adaptation to intracellular environment | stress response models</td>
<td valign="top" align="center">0,020716</td>
</tr>
<tr>
<td valign="top" align="left">Rv1380</td>
<td valign="top" align="left">PyrB; pyrimidine biosynthesis; essential for growth; high confidence drug target | drug response models</td>
<td valign="top" align="center">0,039441</td>
</tr>
<tr>
<td valign="top" align="left">Rv1381</td>
<td valign="top" align="left">PyrC; pyrimidine biosynthesis; growth and survival in host | drug response models</td>
<td valign="top" align="center">4,59E-09</td>
</tr>
<tr>
<td valign="top" align="left">Rv1383</td>
<td valign="top" align="left">CarA; pyrimidine biosynthesis; growth and survival in host | drug response models</td>
<td valign="top" align="center">1,08E-06</td>
</tr>
<tr>
<td valign="top" align="left">Rv1384</td>
<td valign="top" align="left">CarB; pyrimidine biosynthesis; growth and survival in host</td>
<td valign="top" align="center">4,47E-09</td>
</tr>
<tr>
<td valign="top" align="left">Rv1980c</td>
<td valign="top" align="left">Mpt64; Unknown function; tolerance to starvation, highly immunogenic; vaccine and drug target potential</td>
<td valign="top" align="center">0,422015</td>
</tr>
<tr>
<td valign="top" align="left">Rv1997</td>
<td valign="top" align="left">CtpF; Metal cation-transporting ATPase; implicated in dormancy/persistance, response to hypoxia, NO</td>
<td valign="top" align="center">6,10E-06</td>
</tr>
<tr>
<td valign="top" align="left">Rv2108</td>
<td valign="top" align="left">PPE36; unknown function; immuno-active membrane component; diagnostic and vaccine target</td>
<td valign="top" align="center">0,876293</td>
</tr>
<tr>
<td valign="top" align="left">Rv2126c</td>
<td valign="top" align="left">PE_PGRS37; unknown function; possible virulence/adaptation</td>
<td valign="top" align="center">0,988059</td>
</tr>
<tr>
<td valign="top" align="left">Rv2136c</td>
<td valign="top" align="left">UppP; undecaprenyl pyrophosphatase; high confidence drug target | host immune evasion and virulence models</td>
<td valign="top" align="center">5,32E-12</td>
</tr>
<tr>
<td valign="top" align="left">Rv2156</td>
<td valign="top" align="left">MraY; peptidoglycan biosynthesis; growth and survival in host, high confidence drug target</td>
<td valign="top" align="center">0,97868</td>
</tr>
<tr>
<td valign="top" align="left">Rv2703</td>
<td valign="top" align="left">SigA; primary sigma factor in <italic>M. tuberculosis</italic>; host immune response modulator, virulence, growth in host, high confidence drug target | host immune evasion and virulence models</td>
<td valign="top" align="center">0,026023</td>
</tr>
<tr>
<td valign="top" align="left">Rv3340</td>
<td valign="top" align="left">MetC; methionine biosynthesis; growth and survival in host</td>
<td valign="top" align="center">0,649041</td>
</tr>
<tr>
<td valign="top" align="left">Rv3412</td>
<td valign="top" align="left">Unknown function; hypothetical protein; essential for cholesterol metabolism, essential during infection</td>
<td valign="top" align="center">3,27E-07</td>
</tr>
<tr>
<td valign="top" align="left">Rv3621c</td>
<td valign="top" align="left">PPE65; unknown function; possible virulence/adaptation</td>
<td valign="top" align="center">0,035777</td>
</tr>
<tr>
<td valign="top" align="left">Rv3709c</td>
<td valign="top" align="left">Ask; asparate kinase; survival in host</td>
<td valign="top" align="center">1,23E-05</td>
</tr>
<tr>
<td valign="top" align="left">Rv1818</td>
<td valign="top" align="left">PE-PGRS33; unknown function; modulation of host immune response, response to oxygen and starvation</td>
<td valign="top" align="center">1,61E-06</td>
</tr>
<tr>
<td valign="top" align="left">Rv0833</td>
<td valign="top" align="left">PE_PGRS13; unknown function; possible virulence/adaptation</td>
<td valign="top" align="center">9,79E-08</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>A minimum of 2 peptides per protein and 3 transitions per peptide were assessed by SRM for the shortlisted proteins in all seven strains. Intra-assay and inter-assay coefficients of variation were determined for each individual peptide. Intra assay variability was based on 3 technical replicates per strain whilst inter assay variability was assessed based on 2 biological replicates. The signal of each peptide observed was obtained by summing the peak areas of each measured transition for that peptide and then normalizing by the total number of cells per strain at the point of protein extraction. An ANOVA test was used to determine if there was a significant difference in the expression of each of the peptides representing each protein. The single factor ANOVA results (Table <xref ref-type="table" rid="T3">3</xref>) shows that of the 23 peptides assessed, 18 had a significant difference in expression between the 7 strains. The proteins were then broadly classified into 4 groups denoting some aspect of the organisms&#x00027; success in the host (Supplementary Figure <xref ref-type="supplementary-material" rid="SM6">2</xref>) in order to aid further interpretation of the data.</p>
<p>The four proteins assayed with roles in drug response are PyrB, PyrC, CarA, and CarB, and all form part of the pyrimidine biosynthetic operon in <italic>M. tuberculosis</italic>. All with the exception of carB (Rv1384) are more abundant in <italic>M. avium</italic> compared to the other strains, but within the MTBC the Beijing strain has the highest expression of PyrB, PyrC, and CarA.</p>
<p>Amongst proteins which are known to modulate the host immune response, the uncharacterized hypothetical protein Rv0966 is highly expressed in the LAM strain compared to the other strains. In this functional category, Rv2136c, Rv1002, Rv2703, and Rv2108 are more abundant in the Beijing strain. Rv1818c appears to be more abundant in the CAS strain while in the other strains it is present at comparatively low amounts.</p>
<p>Amongst proteins responsible for the growth of <italic>M. tuberculosis</italic> in the host, a possible toxin with unknown function, VapC2 (Rv0301), has the highest relative expression in the Beijing strain. PE_PGRS13 (Rv0833), MetC (Rv3340), and conserved hypothetical protein Rv3412 are all more abundant in the LAM strain than in BCG or <italic>M. avium</italic>, although similarly highly abundant in H37Rv and <italic>M. bovis</italic>. PPE65 (Rv3621c) appears to be upregulated in both LAM and <italic>M. avium</italic> strains.</p>
<p>In terms of adaptation to stress, the Acyl-CoA dehydrogenase MbtN (Rv1346) is particularly abundant in the Beijing strain. The protein Rv0901 is apparently less abundant in <italic>M. bovis</italic> and BCG strains whereas it is relatively abundant in the other strains, particularly so in H37Rv and <italic>M. avium</italic>. Aspartate kinase (Rv3709c) is more abundant in H37Rv and LAM strains comparatively, and almost entirely absent in <italic>M. avium</italic> and <italic>M. bovis</italic>.</p>
<p>The contribution to total signal detected for each protein as measured by SRM in each of the 7 strains is represented in Figure <xref ref-type="fig" rid="F5">5</xref>. This analysis demonstrates that proteins which were detected in a particular strain in the discovery experiment, e.g., Rv0301 and Rv1002c which were observed only in the Beijing strain, tend to contribute the highest signal when measured by SRM. This appears to be clearly the case for 14 of the 23 proteins assessed (Rv0301, Rv1381, Rv1383, Rv1002c, Rv3709c, Rv1346, Rv3412, Rv2108, Rv3621, Rv0833, Rv0966c, Rv1818c, Rv2136c, and Rv3340).</p>
<fig id="F5" position="float">
<label>Figure 5</label>
<caption><p><bold>Comparison of relative protein quantity per strain for the 23 mycobacterial proteins as determined by SRM</bold>. Each color in the stacked bar represents the percentage contribution of that strain to the total detected amount of each protein.</p></caption>
<graphic xlink:href="fmicb-07-00813-g0005.tif"/>
</fig>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<title>Discussion</title>
<p>Although, genetically similar, different strains of <italic>M. tuberculosis</italic> present very different clinical phenotypes in terms of virulence. We therefore postulated that there may be a proteomic mechanism underpinning the differences in pathogenicity observed between strains of <italic>M. tuberculosis</italic> and we explored this possibility using discovery and targeted mass spectrometry techniques. In order to reveal candidate proteins that might be involved in differential pathogenicity, we aimed to compare proteomes between individual pathogenic and non-pathogenic mycobacteria, noting that both BCG and <italic>M. avium</italic> can cause TB-like disease in immune compromised individuals, suggesting that their pathogenicity is attenuated, not lost entirely. To underpin our intended cross-strain and cross-species proteomic comparisons, we first carried out an exhaustive mass spectrometry-based discovery proteomics analysis of the 7 mycobacterial strains. Through use of a sophisticated bioinformatic strategy, combining data from multiple search engines, we obtained &#x0003E;80% coverage at the protein level for 6 out of the 7 theoretical proteomes. Combining data across the 4 <italic>M. tuberculosis</italic> strains, we identified a total of 3788 <italic>M. tuberculosis</italic> proteins with high confidence, meaning that we failed to observe only 235 out of the predicted 4023 proteins in the <italic>M. tuberculosis</italic> proteome. To our knowledge, this level of discovery proteomic coverage across multiple <italic>M. tuberculosis</italic> strains is unprecedented, although we note that recently reported SWATH-based analyses on <italic>M. tuberculosis</italic> H37Rv have come close to this figure (Schubert et al., <xref ref-type="bibr" rid="B27">2015</xref>). Surprisingly, although the 23 proteins subsequently quantified by SRM were initially observed only in the <italic>M. tuberculosis</italic> strains by discovery MS analysis, they were in fact all identified in all 7 strains by SRM analysis, albeit with relative quantifications that correlated to a large degree with our discovery data. Furthermore, SRM analysis of 45 predicted <italic>M. tuberculosis</italic> proteins that had not been observed in our discovery MS analysis of any of the 7 mycobacterial strains revealed that half were in fact expressed in each of the <italic>M. tuberculosis</italic> strains (data not shown), presumably reflecting low absolute expression levels for those proteins, below the detection limit for discovery MS. Taken together, our data suggests that the total expressed complement of proteins is remarkably similar in the different clinical strains of <italic>M. tuberculosis</italic> and moreover that virtually the entire <italic>M. tuberculosis</italic> proteome is expressed in all strains, at least under optimal <italic>in vitro</italic> conditions. However, our data also clearly demonstrates that significant, quantitative differences in expression levels exist between strains which may directly influence the phenotype of these strains. While it is possible that protein quantity does not track with the enzyme activity of that protein in a cell, due to allosteric effects or post-translational modifications, enzyme activity was not measured in our study.</p>
<p>Cross-strain and cross-species comparisons of our semi-quantitative discovery proteomics data were limited only by the relatively poor ortholog mapping found between <italic>M. avium</italic> and <italic>M. tuberculosis</italic> H37Rv and enabled identification of 168 proteins that were originally observed only in the <italic>M. tuberculosis</italic> strains and were therefore considered candidates that might contribute to the differential virulence of these mycobacterial strains. However, we were conscious that our proteomic data had been generated under one set of culture conditions that were likely far removed from the true host environment in TB disease. We therefore cross-correlated our proteomic data with 771 gene expression models deposited in the TBDB, covering a wide range of different <italic>in vitro</italic> culture conditions and exogenous stresses on <italic>M. tuberculosis</italic> that can be thought of as mimicking various aspects of the host environment (e.g., macrophage infection; hypoxia; starvation; etc.). The genes for 23 of the 168 proteins were found to be significantly up- or down-regulated in macrophage-based and related <italic>in vitro</italic> gene expression models of TB disease and we therefore carried out quantitative analysis of their protein expression <italic>in vitro</italic> across the 7 strains, focussing particularly on differential expression in the Beijing and LAM lineages that are known to have particularly virulent clinical phenotypes (Pillay and Sturm, <xref ref-type="bibr" rid="B22">2007</xref>; Cowley et al., <xref ref-type="bibr" rid="B5">2008</xref>).</p>
<p>One of <italic>M. tuberculosis</italic>&#x00027;s many features as a pathogen is its ability to evade the host innate and acquired immune responses such that it is capable of attaining latency and can potentially remain relatively quiescent in alveolar macrophages for decades (Flynn and Chan, <xref ref-type="bibr" rid="B10">2003</xref>). Here, we identified four proteins which modulate the host immune response which are significantly more abundant in the Beijing strain compared to other strains and may therefore have functional significance in conferring virulence in <italic>M. tuberculosis&#x02014;</italic>Rv2136c, Rv1002c, Rv2703, and Rv2108. Mutant <italic>M. tuberculosis</italic> with insertionally inactivated Rv2136c, a known virulence factor of the MTBC (Forrellad et al., <xref ref-type="bibr" rid="B11">2013</xref>), has severe hypersensitivity to acid and a number of other stresses (Vandal et al., <xref ref-type="bibr" rid="B32">2009</xref>). Rv2136c (uppP) is an undecaprenyl pyrophosphate phosphatase which recycles undecaprenyl pyrophosphate back to undecaprenyl phosphate so that it can act again as a receptor for the UDP-MurNAc-pentapeptide to make C55-PP-MurNAc-pentapeptide (lipid 1). The antibiotic Bacitracin inhibits peptidoglycan synthesis by sequestering undecaprenyl diphosphate, thereby reducing the pool of lipid carrier available, whilst increased expression of uppP provides resistance; by extension, Rv2703c might therefore be involved in virulence by speeding up the recycling of key lipid intermediates and hence cell wall biosynthesis, thus conferring a selectable advantage on the virulent Beijing strains. Similarly, sigma factor A (sigA), Rv2703, is the primary sigma factor in this bacterium and is essential for growth. Increased initiation of transcription, and thus RNA processing capacity, may therefore be another mechanism by which this strain has achieved hypervirulence, perhaps coupled to the observed increased expression of several proteins involved in pyrimidine biosynthesis (pyrB, pyr C, CarA). Although the function of Rv1002c is unknown, it is essential for growth in H37Rv (Sassetti et al., <xref ref-type="bibr" rid="B26">2003</xref>), whereas the PPE family protein PPE36 (Rv2108) has no known function and is non-essential for growth in H37Rv. Both of these proteins therefore represent attractive targets for further investigation.</p>
<p>Once inside the host macrophage, <italic>M. tuberculosis</italic> becomes dependent on the intracellular environment for sources of carbon (McKinney et al., <xref ref-type="bibr" rid="B18">2000</xref>; Eisenreich et al., <xref ref-type="bibr" rid="B9">2010</xref>) and iron. The acyl-CoA dehydrogenase, MbtN (Rv1346), is involved in the production of mycobactins which are thought to be vital for the acquisition of iron within the macrophage and are therefore considered to be virulence factors (De Voss et al., <xref ref-type="bibr" rid="B8">2000</xref>). It is notable therefore that MbtN protein was significantly more abundant in the Beijing strain, suggesting that this strain&#x00027;s capacity to acquire iron intracellularly may be superior. The capacity to produce essential amino acids in the host may also provide a selective advantage in terms of virulence, as demonstrated by the increased relative abundance of the O-acetylhomoserine sulfhydrylase MetC (Rv3340) and aspartate kinase Ask (Rv3709c) in the LAM strain.</p>
<p>Another important feature of intracellular <italic>M. tuberculosis</italic> in the persistent phase is the toxin/antitoxin system, of which <italic>M. tuberculosis</italic> has a remarkable 79 encoded loci (Sala et al., <xref ref-type="bibr" rid="B24">2014</xref>). Here we found that the possible toxin VapC2 (Rv0301) was significantly more abundant in the Beijing strain than other clinical strains. Vap C has been reported to suppress translation by hydrolysis of mRNA, so its increased expression in the Beijing strain may represent an evolutionary advantage by providing an efficient means to erase previous transcriptional profiles, thus allowing <italic>M. tuberculosis</italic> to rapidly reprogram the proteome and hence change the metabolic state of the cell in response to rapidly changing external stresses during the bacterium&#x00027;s host-based lifecycle.</p>
<p>Finally, proteins with unknown function are clear targets for further investigation&#x02014;for example the PE_PGRS and PPE family proteins which are known virulence factors yet currently have no functional categorization. Both PE_PGRS13 (Rv0833) and PPE65 (Rv3621c) as well as conserved hypothetical proteins Rv0966 and Rv3412 are abundant in the LAM strain. Interestingly, Rv0901&#x02014;a possible exported or membrane protein with unknown function&#x02014;is abundant in all measured strains except for <italic>M. bovis</italic> and BCG, both of which have attenuated pathogenicity. The loss of this protein could therefore alter the pathogenicity of the bacterium, indicating that this protein is a potential therapeutic target.</p>
<p>An important caveat for any quantitative <italic>in vitro</italic> study on <italic>M. tuberculosis</italic> that aims to correlate gene or protein expression levels with <italic>in vivo</italic> clinical phenotypes is that significant differences in expression observed under specific <italic>in vitro</italic> conditions may not accurately reflect the situation at the site of disease due to altered environmental influences on expression. This is further compounded by the fact that it is not currently technically possible to isolate sufficient <italic>M. tuberculosis</italic> bacilli from the site of disease in a human lung for a discovery proteomics experiment and by the fact that the clinical definitions of &#x0201C;virulence&#x0201D; and &#x0201C;pathogenicity&#x0201D; are themselves largely qualitative. In order to mitigate this caveat, we therefore correlated our quantiative proteomic data with over 700 gene expression models of TB disease&#x02014;themselves acquired under a number of different <italic>in vitro</italic> conditions that each mimic in some way aspects of the stress likely to be experienced by <italic>M. tuberculosis</italic> at the site of disease&#x02014;in order to provide a logical means to infer biological significance from <italic>in vitro</italic> data with greater confidence. A testable prediction from the <italic>in vitro</italic> quantitative proteomic data presented here is thus that the observed differential expression of specific mycobacterial proteins across these 7 strains when cultured under a common set of environmental conditions will affect clinical phenotype <italic>in vivo</italic>. However, the true role of these proteins in virulence will need to be validated in due course by targeted analysis of limiting numbers of <italic>M. tuberculosis</italic> bacilli isolated from the site of disease.</p>
</sec>
<sec sec-type="conclusions" id="s5">
<title>Conclusion</title>
<p>Through our combined discovery- and quantitative proteomic analysis of differential protein expression in 7 mycobacterial strains of varying pathogenicity and virulence, we have uncovered previously unknown, statistically significant quantitative differences in the expression of numerous proteins which begin to shed new light on differential virulence in <italic>M. tuberculosis</italic> strains. In particular, our data suggests strain specific bacterial fitness in the W-Beijing lineage, including: the ability to rapidly remodel the <italic>M. tuberculosis</italic> proteome in response to altered environments; up-regulation of key sigma factors to support rapid transcriptional responses; up-regulation of enzymes involved in pyrimidine biosynthesis and cell wall biosynthesis to promote rapid growth; enhanced mycobactin biosynthesis to promote iron scavenging in the host. These individually selectable traits may then conceivably work together to provide the W-Beijing lineage with an enhanced ability to establish primary infection and active TB disease in a new host. These are testable hypotheses and further research is underway on this now.</p>
</sec>
<sec id="s6">
<title>Author contributions</title>
<p>JP carried out research, wrote initial draft. BC analyzed data, refined and rewrote initial draft to produce final draft. GG, SD, ER, NM, NS, LM assisted with data analysis and JB is principal investigator.</p>
<sec>
<title>Conflict of interest statement</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
</sec>
</body>
<back>
<ack>
<p>We thank the South African Medical Research Council for Fellowships. JB acknowledges the South African National Research Foundation for the Research Chair grant. We would like to acknowledge Olga Schubert and Ruedi Aebersold for access to the <italic>M. tb</italic> SRM Atlas pre-publication.</p>
</ack>
<sec sec-type="supplementary-material" id="s7">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="http://journal.frontiersin.org/article/10.3389/fmicb.2016.00813">http://journal.frontiersin.org/article/10.3389/fmicb.2016.00813</ext-link></p>
<supplementary-material xlink:href="Table1.DOCX" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table2.XLSX" id="SM2" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table3.XLSX" id="SM3" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table4.DOCX" id="SM4" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table5.XLSX" id="SM5" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image1.PDF" id="SM6" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Baker</surname> <given-names>L.</given-names></name> <name><surname>Brown</surname> <given-names>T.</given-names></name> <name><surname>Maiden</surname> <given-names>M. C.</given-names></name> <name><surname>Drobniewski</surname> <given-names>F.</given-names></name></person-group> (<year>2004</year>). <article-title>Silent nucleotide polymorphisms and a phylogeny for <italic>Mycobacterium tuberculosis</italic></article-title>. <source>Emerg. Infect. Dis.</source> <volume>10</volume>, <fpage>1568</fpage>&#x02013;<lpage>1577</lpage>. <pub-id pub-id-type="doi">10.3201/eid1009.040046</pub-id><pub-id pub-id-type="pmid">15498158</pub-id></citation>
</ref>
<ref id="B2">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bifani</surname> <given-names>P. J.</given-names></name> <name><surname>Mathema</surname> <given-names>B.</given-names></name> <name><surname>Kurepina</surname> <given-names>N. E.</given-names></name> <name><surname>Kreiswirth</surname> <given-names>B. N.</given-names></name></person-group> (<year>2002</year>). <article-title>Global dissemination of the <italic>Mycobacterium tuberculosis</italic> W-Beijing family strains</article-title>. <source>Trends Microbiol.</source> <volume>10</volume>, <fpage>45</fpage>&#x02013;<lpage>52</lpage>. <pub-id pub-id-type="doi">10.1016/S0966-842X(01)02277-6</pub-id><pub-id pub-id-type="pmid">11755085</pub-id></citation>
</ref>
<ref id="B3">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Brosch</surname> <given-names>M.</given-names></name> <name><surname>Yu</surname> <given-names>L.</given-names></name> <name><surname>Hubbard</surname> <given-names>T.</given-names></name> <name><surname>Choudhary</surname> <given-names>J.</given-names></name></person-group> (<year>2009</year>). <article-title>Accurate and sensitive peptide identification with Mascot Percolator</article-title>. <source>J. Proteome Res.</source> <volume>8</volume>, <fpage>3176</fpage>&#x02013;<lpage>3181</lpage>. <pub-id pub-id-type="doi">10.1021/pr800982s</pub-id><pub-id pub-id-type="pmid">19338334</pub-id></citation>
</ref>
<ref id="B4">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cottrell</surname> <given-names>J. S.</given-names></name> <name><surname>London</surname> <given-names>U.</given-names></name></person-group> (<year>1999</year>). <article-title>Probability-based protein identification by searching sequence databases using mass spectrometry data</article-title>. <source>Electrophoresis</source> <volume>20</volume>, <fpage>3551</fpage>&#x02013;<lpage>3567</lpage>. <pub-id pub-id-type="pmid">10612281</pub-id></citation>
</ref>
<ref id="B5">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cowley</surname> <given-names>D.</given-names></name> <name><surname>Govender</surname> <given-names>D.</given-names></name> <name><surname>February</surname> <given-names>B.</given-names></name> <name><surname>Wolfe</surname> <given-names>M.</given-names></name> <name><surname>Steyn</surname> <given-names>L.</given-names></name> <name><surname>Evans</surname> <given-names>J.</given-names></name> <etal/></person-group>. (<year>2008</year>). <article-title>Recent and rapid emergence of W-Beijing strains of <italic>Mycobacterium tuberculosis</italic> in Cape Town, South Africa</article-title>. <source>Clin. Infect. Dis.</source> <volume>47</volume>, <fpage>1252</fpage>&#x02013;<lpage>1259</lpage>. <pub-id pub-id-type="doi">10.1086/592575</pub-id><pub-id pub-id-type="pmid">18834315</pub-id></citation>
</ref>
<ref id="B6">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Degroeve</surname> <given-names>S.</given-names></name> <name><surname>Martens</surname> <given-names>L.</given-names></name></person-group> (<year>2013</year>). <article-title>MS2PIP: a tool for MS/MS peak intensity prediction</article-title>. <source>Bioinformatics</source> <volume>29</volume>, <fpage>3199</fpage>&#x02013;<lpage>3203</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btt544</pub-id><pub-id pub-id-type="pmid">24078703</pub-id></citation>
</ref>
<ref id="B7">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Desforges</surname> <given-names>J. F.</given-names></name> <name><surname>Horsburgh</surname> <given-names>C. R.</given-names> <suffix>Jr.</suffix></name></person-group> (<year>1991</year>). <article-title><italic>Mycobacterium avium</italic> complex infection in the acquired immunodeficiency syndrome</article-title>. <source>N. Engl. J. Med.</source> <volume>324</volume>, <fpage>1332</fpage>&#x02013;<lpage>1338</lpage>. <pub-id pub-id-type="pmid">2017230</pub-id></citation>
</ref>
<ref id="B8">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>De Voss</surname> <given-names>J. J.</given-names></name> <name><surname>Rutter</surname> <given-names>K.</given-names></name> <name><surname>Schroeder</surname> <given-names>B. G.</given-names></name> <name><surname>Su</surname> <given-names>H.</given-names></name> <name><surname>Zhu</surname> <given-names>Y.</given-names></name> <name><surname>Barry</surname> <given-names>C. E.</given-names></name></person-group> (<year>2000</year>). <article-title>The salicylate-derived mycobactin siderophores of <italic>Mycobacterium tuberculosis</italic> are essential for growth in macrophages</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>97</volume>, <fpage>1252</fpage>&#x02013;<lpage>1257</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.97.3.1252</pub-id><pub-id pub-id-type="pmid">10655517</pub-id></citation>
</ref>
<ref id="B9">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Eisenreich</surname> <given-names>W.</given-names></name> <name><surname>Dandekar</surname> <given-names>T.</given-names></name> <name><surname>Heesemann</surname> <given-names>J.</given-names></name> <name><surname>Goebel</surname> <given-names>W.</given-names></name></person-group> (<year>2010</year>). <article-title>Carbon metabolism of intracellular bacterial pathogens and possible links to virulence</article-title>. <source>Nat. Rev. Microbiol.</source> <volume>8</volume>, <fpage>401</fpage>&#x02013;<lpage>412</lpage>. <pub-id pub-id-type="doi">10.1038/nrmicro2351</pub-id><pub-id pub-id-type="pmid">20453875</pub-id></citation>
</ref>
<ref id="B10">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Flynn</surname> <given-names>J. L.</given-names></name> <name><surname>Chan</surname> <given-names>J.</given-names></name></person-group> (<year>2003</year>). <article-title>Immune evasion by <italic>Mycobacterium tuberculosis</italic>: living with the enemy</article-title>. <source>Curr. Opin. Immunol.</source> <volume>15</volume>, <fpage>450</fpage>&#x02013;<lpage>455</lpage>. <pub-id pub-id-type="doi">10.1016/S0952-7915(03)00075-X</pub-id><pub-id pub-id-type="pmid">12900278</pub-id></citation>
</ref>
<ref id="B11">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Forrellad</surname> <given-names>M. A.</given-names></name> <name><surname>Klepp</surname> <given-names>L. I.</given-names></name> <name><surname>Gioffr&#x000E9;</surname> <given-names>A.</given-names></name> <name><surname>Sabio y Garc&#x000ED;a</surname> <given-names>J.</given-names></name> <name><surname>Morbidoni</surname> <given-names>H. R.</given-names></name> <name><surname>de la Paz Santangelo</surname> <given-names>M.</given-names></name> <etal/></person-group>. (<year>2013</year>). <article-title>Virulence factors of the <italic>Mycobacterium tuberculosis</italic> complex</article-title>. <source>Virulence</source> <volume>4</volume>, <fpage>3</fpage>&#x02013;<lpage>66</lpage>. <pub-id pub-id-type="doi">10.4161/viru.22329</pub-id><pub-id pub-id-type="pmid">23076359</pub-id></citation>
</ref>
<ref id="B12">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gagneux</surname> <given-names>S.</given-names></name> <name><surname>Small</surname> <given-names>P. M.</given-names></name></person-group> (<year>2007</year>). <article-title>Global phylogeography of <italic>Mycobacterium tuberculosis</italic> and implications for tuberculosis product development</article-title>. <source>Lancet Infect. Dis.</source> <volume>7</volume>, <fpage>328</fpage>&#x02013;<lpage>337</lpage>. <pub-id pub-id-type="doi">10.1016/S1473-3099(07)70108-1</pub-id><pub-id pub-id-type="pmid">17448936</pub-id></citation>
</ref>
<ref id="B13">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Halstrom</surname> <given-names>S.</given-names></name> <name><surname>Price</surname> <given-names>P.</given-names></name> <name><surname>Thomson</surname> <given-names>R.</given-names></name></person-group> (<year>2015</year>). <article-title>Review: environmental mycobacteria as a cause of human infection</article-title>. <source>Int. J. Mycobacteriol.</source> <volume>4</volume>, <fpage>81</fpage>&#x02013;<lpage>91</lpage>. <pub-id pub-id-type="doi">10.1016/j.ijmyco.2015.03.002</pub-id><pub-id pub-id-type="pmid">26972876</pub-id></citation>
</ref>
<ref id="B14">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hanekom</surname> <given-names>M.</given-names></name> <name><surname>Gey van Pittius</surname> <given-names>N. C.</given-names></name> <name><surname>McEvoy</surname> <given-names>C.</given-names></name> <name><surname>Victor</surname> <given-names>T. C.</given-names></name> <name><surname>Van Helden</surname> <given-names>P. D.</given-names></name> <name><surname>Warren</surname> <given-names>R. M.</given-names></name></person-group> (<year>2011</year>). <article-title><italic>Mycobacterium tuberculosis</italic> Beijing genotype: a template for success</article-title>. <source>Tuberculosis (Edinb).</source> <volume>91</volume>, <fpage>510</fpage>&#x02013;<lpage>523</lpage>. <pub-id pub-id-type="doi">10.1016/j.tube.2011.07.005</pub-id><pub-id pub-id-type="pmid">21835699</pub-id></citation>
</ref>
<ref id="B15">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Homolka</surname> <given-names>S.</given-names></name> <name><surname>Post</surname> <given-names>E.</given-names></name> <name><surname>Oberhauser</surname> <given-names>B.</given-names></name> <name><surname>George</surname> <given-names>A. G.</given-names></name> <name><surname>Westman</surname> <given-names>L.</given-names></name> <name><surname>Dafae</surname> <given-names>F.</given-names></name> <etal/></person-group>. (<year>2008</year>). <article-title>High genetic diversity among <italic>Mycobacterium tuberculosis</italic> complex strains from Sierra Leone</article-title>. <source>BMC Microbiol.</source> <volume>8</volume>:<fpage>103</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2180-8-103</pub-id><pub-id pub-id-type="pmid">18578864</pub-id></citation>
</ref>
<ref id="B16">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Malik</surname> <given-names>A. N.</given-names></name> <name><surname>Godfrey-Faussett</surname> <given-names>P.</given-names></name></person-group> (<year>2005</year>). <article-title>Effects of genetic variability of <italic>Mycobacterium tuberculosis</italic> strains on the presentation of disease</article-title>. <source>Lancet Infect. Dis.</source> <volume>5</volume>, <fpage>174</fpage>&#x02013;<lpage>183</lpage>. <pub-id pub-id-type="doi">10.1016/s1473-3099(05)01310-1</pub-id><pub-id pub-id-type="pmid">15766652</pub-id></citation>
</ref>
<ref id="B17">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>McIlwain</surname> <given-names>S.</given-names></name> <name><surname>Tamura</surname> <given-names>K.</given-names></name> <name><surname>Kertesz-Farkas</surname> <given-names>A.</given-names></name> <name><surname>Grant</surname> <given-names>C. E.</given-names></name> <name><surname>Diament</surname> <given-names>B.</given-names></name> <name><surname>Frewen</surname> <given-names>B.</given-names></name> <etal/></person-group>. (<year>2014</year>). <article-title>Crux: rapid open source protein tandem mass spectrometry analysis</article-title>. <source>J. Proteome Res.</source> <volume>13</volume>, <fpage>4488</fpage>&#x02013;<lpage>4491</lpage>. <pub-id pub-id-type="doi">10.1021/pr500741y</pub-id><pub-id pub-id-type="pmid">25182276</pub-id></citation>
</ref>
<ref id="B18">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>McKinney</surname> <given-names>J. D.</given-names></name> <name><surname>zu Bentrup</surname> <given-names>K. H.</given-names></name> <name><surname>Mu&#x000F1;oz-Elias</surname> <given-names>E. J.</given-names></name> <name><surname>Miczak</surname> <given-names>A.</given-names></name> <name><surname>Chen</surname> <given-names>B.</given-names></name> <name><surname>Chan</surname> <given-names>W.-T.</given-names></name> <etal/></person-group>. (<year>2000</year>). <article-title>Persistence of <italic>Mycobacterium tuberculosis</italic> in macrophages and mice requires the glyoxylate shunt enzyme isocitrate lyase</article-title>. <source>Nature</source> <volume>406</volume>, <fpage>735</fpage>&#x02013;<lpage>738</lpage>. <pub-id pub-id-type="doi">10.1038/35021074</pub-id><pub-id pub-id-type="pmid">10963599</pub-id></citation>
</ref>
<ref id="B19">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Merker</surname> <given-names>M.</given-names></name> <name><surname>Blin</surname> <given-names>C.</given-names></name> <name><surname>Mona</surname> <given-names>S.</given-names></name> <name><surname>Duforet-Frebourg</surname> <given-names>N.</given-names></name> <name><surname>Lecher</surname> <given-names>S.</given-names></name> <name><surname>Willery</surname> <given-names>E.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>Evolutionary history and global spread of the <italic>Mycobacterium tuberculosis</italic> Beijing lineage</article-title>. <source>Nat. Genet.</source> <volume>47</volume>, <fpage>242</fpage>&#x02013;<lpage>249</lpage>. <pub-id pub-id-type="doi">10.1038/ng.3195</pub-id><pub-id pub-id-type="pmid">25599400</pub-id></citation>
</ref>
<ref id="B20">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nicol</surname> <given-names>M. P.</given-names></name> <name><surname>Wilkinson</surname> <given-names>R. J.</given-names></name></person-group> (<year>2008</year>). <article-title>The clinical consequences of strain diversity in <italic>Mycobacterium tuberculosis</italic></article-title>. <source>Trans. R. Soc. Tropical Med. Hygiene</source> <volume>102</volume>, <fpage>955</fpage>&#x02013;<lpage>965</lpage>. <pub-id pub-id-type="doi">10.1016/j.trstmh.2008.03.025</pub-id><pub-id pub-id-type="pmid">18513773</pub-id></citation>
</ref>
<ref id="B21">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Parwati</surname> <given-names>I.</given-names></name> <name><surname>van Crevel</surname> <given-names>R.</given-names></name> <name><surname>van Soolingen</surname> <given-names>D.</given-names></name></person-group> (<year>2010</year>). <article-title>Possible underlying mechanisms for successful emergence of the <italic>Mycobacterium tuberculosis</italic> Beijing genotype strains</article-title>. <source>Lancet Infect. Dis.</source> <volume>10</volume>, <fpage>103</fpage>&#x02013;<lpage>111</lpage>. <pub-id pub-id-type="doi">10.1016/S1473-3099(09)70330-5</pub-id><pub-id pub-id-type="pmid">20113979</pub-id></citation>
</ref>
<ref id="B22">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pillay</surname> <given-names>M.</given-names></name> <name><surname>Sturm</surname> <given-names>A. W.</given-names></name></person-group> (<year>2007</year>). <article-title>Evolution of the extensively drug-resistant F15/LAM4/KZN strain of <italic>Mycobacterium tuberculosis</italic> in KwaZulu-Natal, South Africa</article-title>. <source>Clin. Infect. Dis.</source> <volume>45</volume>, <fpage>1409</fpage>&#x02013;<lpage>1414</lpage>. <pub-id pub-id-type="doi">10.1086/522987</pub-id><pub-id pub-id-type="pmid">17990220</pub-id></citation>
</ref>
<ref id="B23">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ribeiro</surname> <given-names>S. C.</given-names></name> <name><surname>Gomes</surname> <given-names>L. L.</given-names></name> <name><surname>Amaral</surname> <given-names>E. P.</given-names></name> <name><surname>Andrade</surname> <given-names>M. R.</given-names></name> <name><surname>Almeida</surname> <given-names>F. M.</given-names></name> <name><surname>Rezende</surname> <given-names>A. L.</given-names></name> <etal/></person-group>. (<year>2014</year>). <article-title><italic>Mycobacterium tuberculosis</italic> strains of the modern sublineage of the Beijing family are more likely to display increased virulence than strains of the ancient sublineage</article-title>. <source>J. Clin. Microbiol.</source> <volume>52</volume>, <fpage>2615</fpage>&#x02013;<lpage>2624</lpage>. <pub-id pub-id-type="doi">10.1128/JCM.00498-14</pub-id><pub-id pub-id-type="pmid">24829250</pub-id></citation>
</ref>
<ref id="B24">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sala</surname> <given-names>A.</given-names></name> <name><surname>Bordes</surname> <given-names>P.</given-names></name> <name><surname>Genevaux</surname> <given-names>P.</given-names></name></person-group> (<year>2014</year>). <article-title>Multiple toxin-antitoxin systems in <italic>Mycobacterium tuberculosis</italic></article-title>. <source>Toxins</source> <volume>6</volume>, <fpage>1002</fpage>&#x02013;<lpage>1020</lpage>. <pub-id pub-id-type="doi">10.3390/toxins6031002</pub-id><pub-id pub-id-type="pmid">24662523</pub-id></citation>
</ref>
<ref id="B25">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sarkar</surname> <given-names>R.</given-names></name> <name><surname>Lenders</surname> <given-names>L.</given-names></name> <name><surname>Wilkinson</surname> <given-names>K. A.</given-names></name> <name><surname>Wilkinson</surname> <given-names>R. J.</given-names></name> <name><surname>Nicol</surname> <given-names>M. P.</given-names></name></person-group> (<year>2012</year>). <article-title>Modern lineages of <italic>Mycobacterium tuberculosis</italic> exhibit lineage-specific patterns of growth and cytokine induction in human monocyte-derived macrophages</article-title>. <source>PLoS ONE</source> <volume>7</volume>:<fpage>e43170</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0043170</pub-id><pub-id pub-id-type="pmid">22916219</pub-id></citation>
</ref>
<ref id="B26">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sassetti</surname> <given-names>C. M.</given-names></name> <name><surname>Boyd</surname> <given-names>D. H.</given-names></name> <name><surname>Rubin</surname> <given-names>E. J.</given-names></name></person-group> (<year>2003</year>). <article-title>Genes required for mycobacterial growth defined by high density mutagenesis</article-title>. <source>Mol. Microbiol.</source> <volume>48</volume>, <fpage>77</fpage>&#x02013;<lpage>84</lpage>. <pub-id pub-id-type="doi">10.1046/j.1365-2958.2003.03425.x</pub-id><pub-id pub-id-type="pmid">12657046</pub-id></citation>
</ref>
<ref id="B27">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Schubert</surname> <given-names>O. T.</given-names></name> <name><surname>Ludwig</surname> <given-names>C.</given-names></name> <name><surname>Kogadeeva</surname> <given-names>M.</given-names></name> <name><surname>Zimmermann</surname> <given-names>M.</given-names></name> <name><surname>Rosenberger</surname> <given-names>G.</given-names></name> <name><surname>Gengenbacher</surname> <given-names>M.</given-names></name> <etal/></person-group>. (<year>2015</year>). <article-title>Absolute proteome composition and dynamics during dormancy and resuscitation of <italic>Mycobacterium tuberculosis</italic></article-title>. <source>Cell Host Microbe</source> <volume>18</volume>, <fpage>96</fpage>&#x02013;<lpage>108</lpage>. <pub-id pub-id-type="doi">10.1016/j.chom.2015.06.001</pub-id><pub-id pub-id-type="pmid">26094805</pub-id></citation>
</ref>
<ref id="B28">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Schubert</surname> <given-names>O. T.</given-names></name> <name><surname>Mouritsen</surname> <given-names>J.</given-names></name> <name><surname>Ludwig</surname> <given-names>C.</given-names></name> <name><surname>R&#x000F6;st</surname> <given-names>H. L.</given-names></name> <name><surname>Rosenberger</surname> <given-names>G.</given-names></name> <name><surname>Arthur</surname> <given-names>P. K.</given-names></name> <etal/></person-group>. (<year>2013</year>). <article-title>The Mtb proteome library: a resource of assays to quantify the complete proteome of <italic>Mycobacterium tuberculosis</italic></article-title>. <source>Cell Host Microbe</source> <volume>13</volume>, <fpage>602</fpage>&#x02013;<lpage>612</lpage>. <pub-id pub-id-type="doi">10.1016/j.chom.2013.04.008</pub-id><pub-id pub-id-type="pmid">23684311</pub-id></citation>
</ref>
<ref id="B29">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shimono</surname> <given-names>N.</given-names></name> <name><surname>Morici</surname> <given-names>L.</given-names></name> <name><surname>Casali</surname> <given-names>N.</given-names></name> <name><surname>Cantrell</surname> <given-names>S.</given-names></name> <name><surname>Sidders</surname> <given-names>B.</given-names></name> <name><surname>Ehrt</surname> <given-names>S.</given-names></name> <etal/></person-group>. (<year>2003</year>). <article-title>Hypervirulent mutant of <italic>Mycobacterium tuberculosis</italic> resulting from disruption of the mce1 operon</article-title>. <source>Proc. Natl. Acad. Sci. U.S.A.</source> <volume>100</volume>, <fpage>15918</fpage>&#x02013;<lpage>15923</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.2433882100</pub-id><pub-id pub-id-type="pmid">14663145</pub-id></citation>
</ref>
<ref id="B30">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shteynberg</surname> <given-names>D.</given-names></name> <name><surname>Nesvizhskii</surname> <given-names>A. I.</given-names></name> <name><surname>Moritz</surname> <given-names>R. L.</given-names></name> <name><surname>Deutsch</surname> <given-names>E. W.</given-names></name></person-group> (<year>2013</year>). <article-title>Combining results of multiple search engines in proteomics</article-title>. <source>Mol. Cell. Proteomics</source> <volume>12</volume>, <fpage>2383</fpage>&#x02013;<lpage>2393</lpage>. <pub-id pub-id-type="doi">10.1074/mcp.R113.027797</pub-id><pub-id pub-id-type="pmid">23720762</pub-id></citation>
</ref>
<ref id="B31">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sun</surname> <given-names>S.</given-names></name> <name><surname>Meyer-Arendt</surname> <given-names>K.</given-names></name> <name><surname>Eichelberger</surname> <given-names>B.</given-names></name> <name><surname>Brown</surname> <given-names>R.</given-names></name> <name><surname>Yen</surname> <given-names>C.-Y.</given-names></name> <name><surname>Old</surname> <given-names>W. M.</given-names></name> <etal/></person-group>. (<year>2007</year>). <article-title>Improved validation of peptide MS/MS assignments using spectral intensity prediction</article-title>. <source>Mol. Cell Proteomics</source> <volume>6</volume>, <fpage>1</fpage>&#x02013;<lpage>17</lpage>. <pub-id pub-id-type="doi">10.1074/mcp.M600320-MCP200</pub-id><pub-id pub-id-type="pmid">17018520</pub-id></citation>
</ref>
<ref id="B32">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Vandal</surname> <given-names>O. H.</given-names></name> <name><surname>Roberts</surname> <given-names>J. A.</given-names></name> <name><surname>Odaira</surname> <given-names>T.</given-names></name> <name><surname>Schnappinger</surname> <given-names>D.</given-names></name> <name><surname>Nathan</surname> <given-names>C. F.</given-names></name> <name><surname>Ehrt</surname> <given-names>S.</given-names></name></person-group> (<year>2009</year>). <article-title>Acid-susceptible mutants of <italic>Mycobacterium tuberculosis</italic> share hypersusceptibility to cell wall and oxidative stress and to the host environment</article-title>. <source>J. Bacteriol.</source> <volume>191</volume>, <fpage>625</fpage>&#x02013;<lpage>631</lpage>. <pub-id pub-id-type="doi">10.1128/JB.00932-08</pub-id><pub-id pub-id-type="pmid">19011036</pub-id></citation>
</ref>
<ref id="B33">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Vizca&#x000ED;no</surname> <given-names>J. A.</given-names></name> <name><surname>Csordas</surname> <given-names>A.</given-names></name> <name><surname>del-Toro</surname> <given-names>N.</given-names></name> <name><surname>Dianes</surname> <given-names>J. A.</given-names></name> <name><surname>Griss</surname> <given-names>J.</given-names></name> <name><surname>Lavidas</surname> <given-names>I.</given-names></name> <etal/></person-group>. (<year>2016</year>). <article-title>2016 update of the PRIDE database and its related tools</article-title>. <source>Nucleic Acids Res.</source> <volume>44</volume>, <fpage>D447</fpage>&#x02013;<lpage>D456</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkv1145</pub-id><pub-id pub-id-type="pmid">26527722</pub-id></citation>
</ref>
<ref id="B34">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>J.</given-names></name> <name><surname>Behr</surname> <given-names>M. A.</given-names></name></person-group> (<year>2014</year>). <article-title>Building a better bacillus: the emergence of <italic>Mycobacterium tuberculosis</italic></article-title>. <source>Front. Microbiol.</source> <volume>5</volume>:<issue>139</issue>. <pub-id pub-id-type="doi">10.3389/fmicb.2014.00139</pub-id><pub-id pub-id-type="pmid">24765091</pub-id></citation>
</ref>
<ref id="B35">
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Warner</surname> <given-names>D. F.</given-names></name> <name><surname>Koch</surname> <given-names>A.</given-names></name> <name><surname>Mizrahi</surname> <given-names>V.</given-names></name></person-group> (<year>2015</year>). <article-title>Diversity and disease pathogenesis in <italic>Mycobacterium tuberculosis</italic></article-title>. <source>Trends Microbiol.</source> <volume>23</volume>, <fpage>14</fpage>&#x02013;<lpage>21</lpage>. <pub-id pub-id-type="doi">10.1016/j.tim.2014.10.005</pub-id><pub-id pub-id-type="pmid">25468790</pub-id></citation>
</ref>
</ref-list>
<fn-group>
<fn id="fn0001"><p><sup>1</sup><ext-link ext-link-type="uri" xlink:href="http://www.sanger.ac.uk/science/tools/mascotpercolator">http://www.sanger.ac.uk/science/tools/mascotpercolator</ext-link></p></fn>
</fn-group>
</back>
</article>