<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Cell. Infect. Microbiol.</journal-id>
<journal-title>Frontiers in Cellular and Infection Microbiology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Cell. Infect. Microbiol.</abbrev-journal-title>
<issn pub-type="epub">2235-2988</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fcimb.2023.1306368</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Cellular and Infection Microbiology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Deciphering complex antibiotic resistance patterns in <italic>Helicobacter pylori</italic> through whole genome sequencing and machine learning</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" equal-contrib="yes">
<name>
<surname>Yu</surname>
<given-names>Jianwei</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
</contrib>
<contrib contrib-type="author" equal-contrib="yes">
<name>
<surname>Jia</surname>
<given-names>Yan</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
</contrib>
<contrib contrib-type="author" equal-contrib="yes">
<name>
<surname>Yu</surname>
<given-names>Qichao</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2574582"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" equal-contrib="yes">
<name>
<surname>Lin</surname>
<given-names>Lan</given-names>
</name>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
<xref ref-type="author-notes" rid="fn003">
<sup>&#x2020;</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Li</surname>
<given-names>Chao</given-names>
</name>
<xref ref-type="aff" rid="aff6">
<sup>6</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Chen</surname>
<given-names>Bowang</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="aff" rid="aff7">
<sup>7</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/490808"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhong</surname>
<given-names>Pingyu</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Lin</surname>
<given-names>Xueqing</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Li</surname>
<given-names>Huilan</given-names>
</name>
<xref ref-type="aff" rid="aff8">
<sup>8</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Sun</surname>
<given-names>Yinping</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhong</surname>
<given-names>Xuejing</given-names>
</name>
<xref ref-type="aff" rid="aff9">
<sup>9</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>He</surname>
<given-names>Yuqi</given-names>
</name>
<xref ref-type="aff" rid="aff10">
<sup>10</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Huang</surname>
<given-names>Xiaoyun</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/432446"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Lin</surname>
<given-names>Shuangming</given-names>
</name>
<xref ref-type="aff" rid="aff11">
<sup>11</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Pan</surname>
<given-names>Yuanming</given-names>
</name>
<xref ref-type="aff" rid="aff12">
<sup>12</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2180417"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Department of Gastroenterology, Longyan First Affiliated Hospital of Fujian Medical University</institution>, <addr-line>Longyan, Fujian</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Department of Gastroenterology, the 7Medical Center of PLA General Hospital</institution>, <addr-line>Beijing</addr-line>, <country>China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Center for Systems Biology, Intelliphecy, Main Building, Beishan Industrial Zone</institution>, <addr-line>Shenzhen, Guangdong</addr-line>, <country>China</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>College of Life Sciences, University of Chinese Academy of Sciences</institution>, <addr-line>Beijing</addr-line>, <country>China</country>
</aff>
<aff id="aff5">
<sup>5</sup>
<institution>Department of Gastroenterology, Xiamen Humanity Hospital</institution>, <addr-line>Xiamen, Fujian</addr-line>, <country>China</country>
</aff>
<aff id="aff6">
<sup>6</sup>
<institution>Department of Gastroenterology, Peking University Aerospace School of Clinical Medicine</institution>, <addr-line>Beijing</addr-line>, <country>China</country>
</aff>
<aff id="aff7">
<sup>7</sup>
<institution>Department of Data Science, Intelliphecy</institution>, <addr-line>Nanjing, Jiangsu</addr-line>, <country>China</country>
</aff>
<aff id="aff8">
<sup>8</sup>
<institution>Department of Nephrology, Longyan First Affiliated Hospital of Fujian Medical University</institution>, <addr-line>Longyan, Fujian</addr-line>, <country>China</country>
</aff>
<aff id="aff9">
<sup>9</sup>
<institution>Department of Science and Education, Longyan First Affiliated Hospital of Fujian Medical University</institution>, <addr-line>Longyan, Fujian</addr-line>, <country>China</country>
</aff>
<aff id="aff10">
<sup>10</sup>
<institution>Department of Gastroenterology, Beijing Chest Hospital, Capital Medical University, Beijing Tuberculosis and Thoracic Tumor Research Institute</institution>, <addr-line>Beijing</addr-line>, <country>China</country>
</aff>
<aff id="aff11">
<sup>11</sup>
<institution>Department of Gastrointestinal Surgery, Longyan First Affiliated Hospital of Fujian Medical University</institution>, <addr-line>Longyan, Fujian</addr-line>, <country>China</country>
</aff>
<aff id="aff12">
<sup>12</sup>
<institution>Cancer Research Center, Beijing Chest Hospital, Capital Medical University, Beijing Tuberculosis and Thoracic Tumor Research Institute</institution>, <addr-line>Beijing</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Shira Lynn Broschat, Washington State University, United States</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Abu Sayed Chowdhury, National Marrow Donor Program, United States</p>
<p>Zhila Esna Ashari, Washington State University, United States</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Yuanming Pan, <email xlink:href="mailto:peterfpan2020@mail.ccmu.edu.cn">peterfpan2020@mail.ccmu.edu.cn</email>; Shuangming Lin, <email xlink:href="mailto:doclin369@aliyun.com">doclin369@aliyun.com</email>; Xiaoyun Huang, <email xlink:href="mailto:x.huang@intelliphecy.com">x.huang@intelliphecy.com</email>
</p>
</fn>
<fn fn-type="equal" id="fn003">
<p>&#x2020;These authors have contributed equally to this work</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>04</day>
<month>01</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2023</year>
</pub-date>
<volume>13</volume>
<elocation-id>1306368</elocation-id>
<history>
<date date-type="received">
<day>03</day>
<month>10</month>
<year>2023</year>
</date>
<date date-type="accepted">
<day>06</day>
<month>12</month>
<year>2023</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2024 Yu, Jia, Yu, Lin, Li, Chen, Zhong, Lin, Li, Sun, Zhong, He, Huang, Lin and Pan</copyright-statement>
<copyright-year>2024</copyright-year>
<copyright-holder>Yu, Jia, Yu, Lin, Li, Chen, Zhong, Lin, Li, Sun, Zhong, He, Huang, Lin and Pan</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<sec>
<title>Introduction</title>
<p>Helicobacter pylori (H.pylori, Hp) affects billions of people worldwide. However, the emerging resistance of Hp to antibiotics challenges the effectiveness of current treatments. Investigating the genotype-phenotype connection for Hp using next-generation sequencing could enhance our understanding of this resistance.</p>
</sec>
<sec>
<title>Methods</title>
<p>In this study, we analyzed 52 Hp strains collected from various hospitals. The susceptibility of these strains to five antibiotics was assessed using the agar dilution assay. Whole-genome sequencing was then performed to screen the antimicrobial resistance (AMR) genotypes of these Hp strains. To model the relationship between drug resistance and genotype, we employed univariate statistical tests, unsupervised machine learning, and supervised machine learning techniques, including the development of support vector machine models.</p>
</sec>
<sec>
<title>Results</title>
<p>Our models for predicting Amoxicillin resistance demonstrated 66% sensitivity and 100% specificity, while those for Clarithromycin resistance showed 100% sensitivity and 100% specificity. These results outperformed the known resistance sites for Amoxicillin (A1834G) and Clarithromycin (A2147), which had sensitivities of 22.2% and 87%, and specificities of 100% and 96%, respectively.</p>
</sec>
<sec>
<title>Discussion</title>
<p>Our study demonstrates that predictive modeling using supervised learning algorithms with feature selection can yield diagnostic models with higher predictive power compared to models relying on single single-nucleotide polymorphism (SNP) sites. This approach significantly contributes to enhancing the precision and effectiveness of antibiotic treatment strategies for Hp infections. The application of whole-genome sequencing for Hp presents a promising pathway for advancing personalized medicine in this context.</p>
</sec>
</abstract>
<kwd-group>
<kwd>antimicrobial resistance (AMR)</kwd>
<kwd>Helicobactor pylori</kwd>
<kwd>genomic sequencing data</kwd>
<kwd>machine learning methods</kwd>
<kwd>molecular mechanism</kwd>
</kwd-group>
<counts>
<fig-count count="7"/>
<table-count count="0"/>
<equation-count count="0"/>
<ref-count count="21"/>
<page-count count="14"/>
<word-count count="5897"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>Clinical Microbiology</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<title>Introduction</title>
<p>
<italic>Hp</italic> infection as the gram-negative pathogen, was estimated to infect over 50% of the world population, which is the cause for chronic gastritis (<xref ref-type="bibr" rid="B13">Salih, 2009</xref>). There are more evidences of the adverse events of <italic>Hp</italic> infection, patients with chronic <italic>Hp</italic> infection were more likely to have gastric cancer in their lifetime (<xref ref-type="bibr" rid="B20">Wroblewski et&#xa0;al., 2010</xref>), and Combination of antibiotics and mucosa protection drug is the standard of care for <italic>Hp</italic> infected patients. However, antibiotic resistance posed a significant challenge in clinical practice. The resistance of <italic>Hp</italic> to amoxicillin and tetracycline was as high as 9% and 15% respectively in a north China cohort (<xref ref-type="bibr" rid="B18">Wang et&#xa0;al., 2019</xref>). Both amoxicillin and tetracycline were first-line antibiotics used in clinic. Trial and error strategy not only increased cost and treatment time for the patients, but also renders the patients a higher probability of side effects. Antimicrobial susceptibility testing (AST) was adopted in clinic for patients who have failed standard treatment options (<xref ref-type="bibr" rid="B14">Smith et&#xa0;al., 2014</xref>). However, AST was limited by the culturing method and typically required a lengthy time.</p>
<p>Next generation sequencing (NGS) has emerged to be a powerful technology to characterize microbiome in the past decade (<xref ref-type="bibr" rid="B7">Malla et&#xa0;al., 2018</xref>). NGS allows the analysis of microbial composition within a sample and microbial subtyping with in-depth sequencing and SNP calling. NGS derived bacterial genotype has been related to phenotypes under a variety of circumstances (<xref ref-type="bibr" rid="B16">van Opijnen and Camilli, 2012</xref>; <xref ref-type="bibr" rid="B2">Dutilh et&#xa0;al., 2013</xref>; <xref ref-type="bibr" rid="B9">Mousavizadeh and Ghasemi, 2021</xref>). It has been reported that mutations in 23S rRNA were associated with clarithromycin resistance in <italic>Hp</italic> (<xref ref-type="bibr" rid="B17">Versalovic et&#xa0;al., 1996</xref>). Previous studies have shown that phenotypic resistance correlates well with genetic tests, while failed to provide high confidence single locus to accurately describe resistant patterns for different antibiotics (<xref ref-type="bibr" rid="B1">Camorlinga-Ponce et&#xa0;al., 2020</xref>). The inaccuracy of predicting antibiotic resistance was partially attributable to incomplete penetration of mutations in dictating phenotypes. Researchers explored the feasibility to use genotype-based machine learning methods to model the antimicrobial resistance of Actinobacillus pleuropneumoniae from Whole genome sequencing (WGS) data (<xref ref-type="bibr" rid="B6">Liu et&#xa0;al., 2020</xref>). Currently, systemic effort to address the antibiotic resistance of <italic>Hp</italic> using supervised machine learning is still lacking.</p>
<p>In this study, we established a workflow measure the phenotype and genotype of Hp strains, including Hp culturing and single colony picking, disk diffusion test and whole genome sequencing. We interrogated the antibiotic resistance of <italic>Hp</italic> by combining whole genome sequencing and machine learning approach. SNP was determined for Hp strains and used as input for modeling antibiotic resistance, with single SNP modeling, unsupervised and supervised machine learning. The goal is to explore the possibility to use WGS in clinical setting to predict antimicrobial resistance.</p>
</sec>
<sec id="s2" sec-type="results">
<title>Results</title>
<sec id="s2_1">
<title>Summary of patient cohort</title>
<p>A comprehensive summary of the patient cohort enrolled in our study is presented in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;1</bold>
</xref>. With patient age spanning from 23 to 71 years, the broad age distribution underscores the extensive impact of <italic>Hp</italic> infection across the entire population. The diverse age range vividly reflects the ubiquitous nature of <italic>Hp</italic>&#x2019;s influence. Notably, <italic>Hp</italic> isolates derived from these patients underwent rigorous drug testing to ascertain their susceptibility to six antibiotics, namely Amoxicillin, Clarithromycin, Levofloxacin, Metronidazole, Tetracycline, and Furazolidone. Interestingly, 86.5% of strains (45/52) are resistant to Metronidazole.</p>
<p>The statistic for enrolled patients and analyzed strains are summarized in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;2</bold>
</xref>. The patient cohort included 21/52 (40.4%) male patients and 31/52 (59.6%) female patients. The median age is 50. The rate of resistance are 17.3% for Amoxicillin, 44.2% for Clarithromycin, 38.5% for Levofloxacin and 86.5% for Metronidazole. All strains are sensitive to Furazolidone. Only one strain is resistant to Tetracycline.</p>
<p>To investigate how the genotype information of <italic>Hp</italic> can be used to predict antibiotic resistance, we established a workflow to measure drug sensitivity phenotype using disk diffusion test and genotype using whole genome sequencing (<xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>). The relation between genotype and phenotype was modeled using univariate statistical test, unsupervised machine learning (phylogenetic analysis) and supervised machine learning (support vector machine).</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Summary of the workflow. Schematic summary of our study. The phenotype and genotype of <italic>Hp</italic> strains were quantitatively measured and the relationship between <italic>Hp</italic> phenotype and genotype was modeled by univariate analysis, unsupervised clustering and support vector machine.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fcimb-13-1306368-g001.tif"/>
</fig>
</sec>
<sec id="s2_2">
<title>Overview of SNPs</title>
<p>The pivotal aspect of our investigation involved subjecting <italic>Hp</italic> isolates obtained from the patients to cutting-edge next-generation sequencing. This technological approach facilitated the comprehensive acquisition of whole genome data. To ensure the reliability and quality of our findings, patients lacking accurate clinical data were thoughtfully excluded, as were patients yielding insufficient SNP data due to data quality concerns. Seven patients were excluded because lack of clinical information. Five patients were removed from downstream analysis as the total number of SNP is less than 3000. This stringent curation led to the inclusion of a robust cohort comprising 52 patients. In total, our study unveiled a median of 66,198 SNPs identified among these patients. The significant SNPs for Amoxicillin, Clarithromycin, Levofloxacin, Metronidazole and Tetracycline were summarized in (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Tables&#xa0;3&#x2013;7</bold>
</xref>).</p>
</sec>
<sec id="s2_3">
<title>Modeling approaches</title>
<p>Leveraging this pool of extracted SNPs, we conducted a series of rigorous downstream analyses. These analyses encompassed single SNP statistical tests, the construction of phylogenetic trees, and the implementation of supervised machine learning using Support Vector Machine. This multi-faceted approach allowed us to draw comprehensive insights into the genetic intricacies underpinning antibiotic resistance in <italic>Hp</italic> strains within our patient cohort.</p>
<p>Three modeling approaches were undertaken to address the relationship between antibiotic resistance and genotype, including univariate statistical test, unsupervised machine learning and supervised machine learning. Univariate statistical test serves as a foundational method to identify basic relationships and differences between resistant and sensitive strains. This approach is valuable for its simplicity and clarity, providing an initial understanding of the data. For the unsupervised machine learning component, phylogenetic analysis was employed. Phylogenetic trees facilitates the visualization and clustering of different strains, offering insights into how genetic variations might influence antibiotic resistance. For supervised machine learning, the Support Vector Machine (SVM) algorithm was selected for its effectiveness in classification tasks, especially in high-dimensional spaces. This approach is particularly beneficial when labeled data is available and predictive modeling is desired.</p>
<p>To evaluate the model performance, we used sensitivity and specificity throughout our study. Sensitivity and specificity are two key metrics used to evaluate the performance of a diagnostic test or model. Briefly, in our study sensitivity measures the proportion of actual positives (resistant strains) that are correctly identified by the model. Specificity measures the proportion of actual negatives (sensitive strains) that are correctly identified by the model.</p>
</sec>
<sec id="s2_4">
<title>Prediction of amoxicillin resistance</title>
<p>We identified 2483 significant SNPs for Amoxicillin (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;3</bold>
</xref>), including one significant site on 23S rRNA (A1834G). Using individual SNP for Amoxicillin resistance prediction, we evaluated the model with sensitivity and specificity. In this case the presence of a SNP suggested that the sequenced strain was an Amoxicillin resistant one. This assumption allowed us to determine the sensitivity and specificity of the individual models based on one single SNP site. We plotted the sensitivity and specificity of all resulted models (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2A</bold>
</xref>). The sensitivity ranged from 0 to 1, with a mean sensitivity of 0.45. The specificity also ranged from 0 to 1, with a mean specificity of 0.46. It was difficult to obtain a good tradeoff between model sensitivity and specificity (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2B</bold>
</xref>). For A1834G of 23S rRNA, the model achieved 100% specificity and only 22.2% sensitivity.</p>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>Amoxicillin resistance modeling using phylogenetic tree construction and single SNP classification. <bold>(A)</bold> Phylogenetic tree for Amoxicillin. Amoxicillin resistance is color coded indicating sensitive (Dark Green), resistant (Red), intermediate (Grey) and lowly sensitive (Light Green); Treatment result is color coded indicating Effective (Black) and Failed (Grey); Group is color coded to indicate two different gastric mucosa protection drugs A (Sky Blue) and B (Light Yellow); Gender is color coded to indicate Male (Blue) and Female (Red); Age is color coded to indicated different ranges, with darker color indicating larger age. <bold>(B)</bold> Sensitivity and specificity distribution for the models derived from single SNP site to predict Amoxicillin resistance. <bold>(C)</bold> Relationship between model sensitivity and model specificity was visualized as scatter plot. Blue line is fitted linear model.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fcimb-13-1306368-g002.tif"/>
</fig>
<p>To enhance model performance, we took all 2483 significant sites as input for the construction of phylogenetic tree. The phylogenetic tree indicated that sensitive and resistant strains were well separated (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2C</bold>
</xref>).</p>
</sec>
<sec id="s2_5">
<title>Prediction of clarithromycin resistance</title>
<p>In our investigation, we identified a total of 266 significant SNPs associated with Clarithromycin resistance (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;4</bold>
</xref>), among which a noteworthy site was found on the 23S rRNA gene (A2147G). To predict Clarithromycin resistance, we utilized individual SNPs as predictive markers and assessed the model&#x2019;s performance. The model&#x2019;s effectiveness was evaluated by plotting the sensitivity and specificity of the resulting models (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3A</bold>
</xref>). Sensitivity values ranged from 0 to 1, with a mean sensitivity of 0.4, while specificity values ranged from 0 to 1, with a mean specificity of 0.58. Notably, except for A2147G, achieving a balanced tradeoff between model sensitivity and specificity proved to be challenging (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3B</bold>
</xref>). However, for the specific case of A2147G on the 23S rRNA gene, the model demonstrated 87% sensitivity and 96% specificity.</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Clarithromycin resistance modeling using phylogenetic tree construction and single SNP classification. <bold>(A)</bold> Phylogenetic tree for Clarithromycin. Clarithromycin resistance is color coded indicating sensitive (Dark Green), resistant (Red), intermediate (Grey) and lowly sensitive (Light Green); Treatment result is color coded indicating Effective (Black) and Failed (Grey); Group is color coded to indicate two different gastric mucosa protection drugs A (Sky Blue) and B (Light Yellow); Gender is color coded to indicate Male (Blue) and Female (Red); Age is color coded to indicated different ranges, with darker color indicating larger age. <bold>(B)</bold> Sensitivity and specificity distribution for the models derived from single SNP site to predict Clarithromycin resistance. <bold>(C)</bold> Relationship between model sensitivity and model specificity was visualized as scatter plot. Blue line is fitted linear model.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fcimb-13-1306368-g003.tif"/>
</fig>
<p>To further enhance the predictive capabilities of the models, we incorporated all 266 significant SNP sites as input for the construction of a phylogenetic tree. The outcome of this phylogenetic analysis indicated that strains with different sensitivities to Clarithromycin could be distinctly separated (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3C</bold>
</xref>). This result highlighted that through phylogenetic analysis, different strains of Helicobacter pylori were distinctly categorized based on their individual reactions to the antibiotic Clarithromycin, as evidenced by their separation in the phylogenetic tree.</p>
</sec>
<sec id="s2_6">
<title>Prediction of Levofloxacin resistance</title>
<p>We identified a total of 200 significant SNPs associated with Levofloxacin resistance (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;5</bold>
</xref>), among which a significant site was found on the 23S rRNA gene (A2147G). To predict Levofloxacin resistance, we employed individual SNPs as predictive markers and evaluated the model performance. The performance metrics of the resultant models were assessed by plotting sensitivity and specificity (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4A</bold>
</xref>). Sensitivity values ranged from 0 to 1, with a mean of 0.4, while specificity values ranged from 0 to 1, with a mean of 0.58. Interestingly, there appeared to be a negative correlation between sensitivity and specificity (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4B</bold>
</xref>). Notably, the model for A2147G of the 23S rRNA gene achieved 65% sensitivity and 71% specificity.</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Levofloxacin resistance modeling using phylogenetic tree construction and single SNP classification. <bold>(A)</bold> Phylogenetic tree for Levofloxacin. Levofloxacin resistance is color coded indicating sensitive (Dark Green), resistant (Red), intermediate (Grey) and lowly sensitive (Light Green); Treatment result is color coded indicating Effective (Black) and Failed (Grey); Group is color coded to indicate two different gastric mucosa protection drugs A (Sky Blue) and B (Light Yellow); Gender is color coded to indicate Male (Blue) and Female (Red); Age is color coded to indicated different ranges, with darker color indicating larger age. <bold>(B)</bold> Sensitivity and specificity distribution for the models derived from single SNP site to predict Levofloxacin resistance. <bold>(C)</bold> Relationship between model sensitivity and model specificity was visualized as scatter plot. Blue line is fitted linear model.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fcimb-13-1306368-g004.tif"/>
</fig>
<p>To maximize the separation in resistant and sensitive strains, we utilized all 200 significant SNP sites as input to construct a phylogenetic tree. The resulting phylogenetic tree exhibited distinct separation between Levofloxacin-sensitive and resistant strains (<xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4C</bold>
</xref>). This phylogenetic analysis provided additional support for the differentiation between bacterial strains based on their Levofloxacin resistance profiles.</p>
</sec>
<sec id="s2_7">
<title>Prediction of Metronidazole resistance</title>
<p>We successfully identified a total of 379 significant SNPs associated with Metronidazole resistance (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table&#xa0;6</bold>
</xref>), among which an important site on the 23S rRNA (G1517A) stood out. Employing individual SNPs for Metronidazole resistance prediction, we evaluated the performance metrics of our models. The sensitivity and specificity of all resulting models were plotted and analyzed (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5A</bold>
</xref>). The spectrum of sensitivity scores ranged between 0 and 1, with an average sensitivity value of 0.41. Correspondingly, specificity scores ranged between 0 and 1, yielding an average specificity of 0.52. Remarkably, one single SNP model emerged as an outlier, achieving nearly 100% sensitivity and an impressive 100% specificity (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5B</bold>
</xref>). However, when focusing on the known G1517A variant of the 23S rRNA, the model exhibited only 2% sensitivity and 50% specificity.</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>Metronidazole resistance modeling using phylogenetic tree construction and single SNP classification. <bold>(A)</bold> Phylogenetic tree for Metronidazole. Metronidazole resistance is color coded indicating sensitive (Dark Green), resistant (Red), intermediate (Grey) and lowly sensitive (Light Green); Treatment result is color coded indicating Effective (Black) and Failed (Grey); Group is color coded to indicate two different gastric mucosa protection drugs A (Sky Blue) and B (Light Yellow); Gender is color coded to indicate Male (Blue) and Female (Red); Age is color coded to indicated different ranges, with darker color indicating larger age. <bold>(B)</bold> Sensitivity and specificity distribution for the models derived from single SNP site to predict Metronidazole resistance. <bold>(C)</bold> Relationship between model sensitivity and model specificity was visualized as scatter plot. Blue line is fitted linear model.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fcimb-13-1306368-g005.tif"/>
</fig>
<p>For unsupervised clustering of all strains based on SNP information, we leveraged all 379 significant sites as input for the construction of a phylogenetic tree. The resulting tree compellingly demonstrated that Metronidazole-sensitive and resistant strains could be distinctly separated (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5C</bold>
</xref>).</p>
</sec>
<sec id="s2_8">
<title>Assessing clinical treatment outcomes</title>
<p>Furthermore, we conducted a comprehensive investigation into the potential impact of two different gastric mucosal protective agents (Group A and B) on treatment outcomes for <italic>Hp</italic> infections. More information about treatment scheme is documented in method. <italic>Hp</italic> is eradicated in 83.3% of strains treated with A and 85.7% of strains treated with B (<italic>p</italic> = 1). For the eight strains not successfully eradicated by Amoxicillin and Clarithromycin, four strains are resistant to both Amoxicillin and Clarithromycin and the other four stains are resistant to either Amoxicillin (n =2) or Clarithromycin (n =2).</p>
</sec>
<sec id="s2_9">
<title>Prediction of amoxicillin resistance using SVM</title>
<p>Using the known A1834G of 23S rRNA, the univariate model achieved 100% specificity and only 22.2% sensitivity. The mean sensitivity and specificity for single SNP model are only 0.45 and 0.46. All single SNP models with 100% specificity have sensitivity less than 50%. Therefore, we aimed to investigate the application of the supervised machine learning algorithm SVM in developing a predictive model for Amoxicillin resistance. Here we employed all significantly different SNP sites between resistant and sensitive strains to train SVM model. The feature selection procedure reduced the number of dimensions for the classification problem. Through this approach, we successfully generated an SVM model with 100% sensitivity and 100% specificity in predicting sensitive and resistant <italic>Hp</italic> strains (<xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref>). For the four strains (two lowly sensitive strains and two intermediate strains regarding Amoxicillin response) not used in model training, the model predicted all four strains as Amoxicillin sensitive.</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>Support vector machine modeling of Amoxicillin resistance. SNP-patient matrix was displayed as a heatmap, with each row indicating one SNP site and each column one patient. Model Prediction was color coded as Sensitive (Grey) and Resistant (Purple); Group was color coded as gastric mucosa protection drugs A (Light Green) and B (Pink); Treatment outcome was color coded as non-responders (Orange) and Responders (Blue). Amoxicillin sensitivity is color coded as sensitive (Grey), lowly sensitive (Pink), intermediate (Red) and resistant (Dark red); Gender is color coded to indicate male (Blue) and female (Red); Age is color coded from white to Green. The confusion matrix for the entire cohort was also shown.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fcimb-13-1306368-g006.tif"/>
</fig>
<p>Although this model allows us to obtain a good tradeoff between sensitivity and specificity, it is subjected to potential bias as we have much more variables than observations. To maximize the generalizability of the model, we implemented two validation procedures. In the first procedure, the original dataset was randomly split into training set (60%) and test set (40%). We obtained a model with 66.6% sensitivity and 100% specificity in the test set. In the second procedure, we employed 5-fold cross-validation. All five resulted models displayed 100% specificity, while the maximal sensitivity obtained is 50% in three models.</p>
</sec>
<sec id="s2_10">
<title>Prediction of Clarithromycin resistance using SVM</title>
<p>Using the known A2147G on the 23S rRNA gene, the model to predict Clarithromycin resistance demonstrated 87% sensitivity and 96% specificity. We further asked whether we could improve the model performance if we incorporate all significantly different SNP between Clarithromycin sensitive and resistant strains. Consequently, our investigation delved into the application of a supervised machine learning algorithm, specifically Support Vector Machine (SVM), in the development of a predictive model for Clarithromycin resistance. Remarkably, our efforts yielded a model that achieved 100% sensitivity and 100% specificity in predicting Clarithromycin-sensitive and resistant Hp strains (<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7</bold>
</xref>).</p>
<fig id="f7" position="float">
<label>Figure&#xa0;7</label>
<caption>
<p>Support vector machine modeling of Clarithromycin resistance. SNP-patient matrix was displayed as a heatmap, with each row indicating one SNP site and each column one patient. Model Prediction was color coded as Sensitive (Grey) and Resistant (Purple); Group was color coded as gastric mucosa protection drugs A (Light Green) and B (Pink); Treatment outcome was color coded as non-responders (Orange) and Responders (Blue). Clarithromycin sensitivity is color coded as sensitive (Grey), intermediate (Red) and resistant (Dark red); Gender is color coded to indicate male (Blue) and female (Red); Age is color coded from white to Green. The confusion matrix for the entire cohort was also shown.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fcimb-13-1306368-g007.tif"/>
</fig>
<p>Similar to the case of Amoxicillin resistance prediction with SVM, the resulted model strikes a perfect balance of sensitivity and specificity that is subjected to overfitting. The validation was implemented by two procedures. In the split procedure (60% training and 40% test), the model reached 100% sensitivity and 100% specificity in the test data. Using 5-fold cross-validation, all five resulted models exhibited 100% sensitivity and 100% specificity.</p>
</sec>
</sec>
<sec id="s3" sec-type="discussion">
<title>Discussion</title>
<p>Whole genome sequencing had been successfully adopted in the clinic for Mycobacterium tuberculosis (<xref ref-type="bibr" rid="B19">Witney et&#xa0;al., 2016</xref>) and played important roles in identification of mutant strains of SARS-Cov-2 (<xref ref-type="bibr" rid="B10">Oude Munnink et&#xa0;al., 2020</xref>). In our study, we employed a comprehensive whole-genome sequencing approach to unravel the intricate antibiotic resistance patterns of <italic>Hp</italic>. Although antimicrobial resistance in <italic>Hp</italic> is a global threat to human health and the underlying molecular mechanisms have been explored in our study. In contrast to traditional phenotyping methods, which are characterized by their time-consuming nature and notable variability (<xref ref-type="bibr" rid="B3">Gerrits et&#xa0;al., 2006</xref>), our study showcases the remarkable advantages of employing Whole Genome Sequencing (WGS) for the prediction of <italic>Hp</italic> antibiotic resistance. The conventional approach, reliant on bacterial culture and drug testing, often consumes valuable time and yields results that are prone to experimental variation. In stark contrast, WGS offers an efficient, rapid, and precise alternative that holds immense potential in clinical setting.</p>
<p>Our research did not perform an exhaustive comparison between existing methodologies for predicting Helicobacter pylori (<italic>Hp</italic>) resistance and our proposed approach. The primary objective of our study was not to develop an optimal model, but rather to investigate the capabilities of machine learning in predicting Hp resistance. It is important to note that our final model might be subject to overfitting due to the limited size of our dataset, despite implementing cross-validation techniques. Traditional studies employing WGS typically rely on univariate statistical methods. One study frequently analyzed resistance-associated sites through kappa concordance analysis to identify both known and novel Hp resistance loci in WGS data (<xref ref-type="bibr" rid="B21">Zhou et&#xa0;al., 2022</xref>). Another study has concentrated on recognized drug resistance genes, like multidrug-resistant efflux pump genes (<xref ref-type="bibr" rid="B4">Iwamoto et&#xa0;al., 2014</xref>). The prediction of antimicrobial resistance based on WGS and machine learning has been explored using various supervised learning algorithms, particularly in studies involving the whole genome sequencing of Escherichia coli (<xref ref-type="bibr" rid="B11">Ren et&#xa0;al., 2022</xref>). Our study introduces a novel feature selection strategy for constructing machine learning models, diversifying the methodological approaches in this field.</p>
<p>Our findings underscored the challenge of achieving good sensitivity and specificity concurrently with models based on a single SNP site. Notably, a rare exception emerged with the single A2147G mutation on the 23S rRNA, which exhibited high sensitivity and specificity in predicting Clarithromycin resistance. This alignment with previous research corroborates the clear link between Clarithromycin resistance in <italic>Hp</italic> and A2146 and A2147 mutations (<xref ref-type="bibr" rid="B5">Lauener et&#xa0;al., 2019</xref>). We further demonstrated the efficacy of constructing phylogenetic trees based on significant SNP sites, revealing substantial separation between antibiotic-sensitive and resistant strains. These results suggest that future investigations aimed at building predictive models utilizing a combination of SNP sites could be a fruitful avenue to explore.</p>
<p>The complex nature of antimicrobial resistance in <italic>Hp</italic> underscores the limitations of predictive modeling based on single SNP sites (<xref ref-type="bibr" rid="B12">Reygaert, 2018</xref>). For instance, <italic>Hp</italic>&#x2019;s resistance to Levofloxacin is likely linked to gyrase, an enzyme responsible for DNA negative supercoiling. Point mutations at amino acids 87, 88, 91, and 97 have been identified as potential Levofloxacin resistance determinants (<xref ref-type="bibr" rid="B8">Moore et&#xa0;al., 1995</xref>). Nonetheless, our study did not identify a single SNP site with the dual qualities of high sensitivity and specificity in predicting Levofloxacin resistance.</p>
<p>The challenging balance between high sensitivity and specificity for models based on single SNP sites primarily stems from the diverse mechanisms that underlie antibiotic resistance in <italic>Hp</italic>. Despite the promising potential of whole-genome sequencing in clinical medicine, our study does have several limitations. Firstly, our supervised machine learning approach relied on accurate phenotyping through traditional culturing and drug testing, which are susceptible to experimental variations (<xref ref-type="bibr" rid="B15">Su et&#xa0;al., 2019</xref>). Secondly, genome sequencing and drug testing of a single <italic>Hp</italic> colony oversimplify the complex clinical reality, where patients may harbor heterogeneous <italic>Hp</italic> populations within an intricate ecosystem of coexisting microbiota.</p>
<p>The construction of predictive modeling of antibiotic resistance was enhanced by feature selection. Significantly different SNP sites between sensitive and resistant strains were used as model input. In the case of Amoxicillin resistance, the best model has a sensitivity of 66% and a specificity of 100% in test data, while the known A1834G of 23S rRNA achieved 100% specificity and only 22.2% sensitivity. For Clarithromycin resistance, all trained models exhibited 100% sensitivity and 100% specificity in both training data and test data. This improved the performance of the known A2147G on the 23S rRNA gene, which has a sensitivity of 87% and a specificity of 96%. As proof-of-concept, predictive modeling using SVM with feature selection could lead to diagnostic model with higher predictive power.</p>
<p>Our study used sensitivity and specificity to evaluate the diagnostic models derived from different approaches. It&#x2019;s important to note that sensitivity and specificity are inversely related. Increasing one often leads to a decrease in the other. The ideal model would have both high sensitivity and high specificity, but in practice, a balance is usually sought based on the consequences of false positives and false negatives. In a clinical setting, these metrics guide the choice of a diagnostic test based on what is more critical: not missing the condition (high sensitivity) or not incorrectly diagnosing it when it&#x2019;s not there (high specificity). High sensitivity ensures resistant strains are correctly identified and treated.</p>
<p>One major limitation of our study is the small patient cohort. In the case of Amoxicillin drug resistance, we only have nine resistant strains. This limits our ability to train models with low variance. If the test dataset is small, we could have few or no resistant strains for Amoxicillin. In our small cohort, we did not have any resistant strain for Furazolidone and we only had one resistant strain for Tetracycline. This renders it impossible to address Furazolidone or Tetracycline resistance. Nevertheless, our dataset might be used for integration with other accessible datasets in the community for future predictive modeling efforts.</p>
<p>Taken together, the intricate antibiotic resistance patterns revealed by our whole-genome sequencing approach emphasize the need for a holistic perspective in understanding the dynamics of antimicrobial resistance in <italic>Hp</italic>. The lack of single SNP sites with simultaneous high sensitivity and specificity underscores the multifaceted nature of resistance mechanisms that this pathogen employs. As such, the incorporation of supervised machine learning techniques may hold the key to achieving more accurate and reliable predictive models for antibiotic resistance. Our findings emphasize the need for continued multidisciplinary research efforts that bridge genomics, microbiology, machine learning, and clinical medicine.</p>
</sec>
<sec id="s4">
<title>Methods</title>
<sec id="s4_1">
<title>Sample collection and ethical approval</title>
<p>In total we collected sample from 52 patients with <italic>Hp</italic> infections. All enrolled patients have no intake of antibiotics within one month, no consumption of PPI or Chinese traditional medicine within two weeks. UBT test was employed to confirm the positivity of <italic>Hp</italic> infection. Biopsy samples were preserved in cultivation media and transported to laboratory at 4 degree. The studies involving human participants were reviewed and approved by the seventh Medical Center of PLA General Hospital Ethics Committee (No.2017-74) and other departments of gastroenterology from different hospitals applied and followed this content&#x2019;s introduction. The patients/participants provided their written informed consent to participate in this study.</p>
</sec>
<sec id="s4_2">
<title>Stratification by treatment outcome</title>
<p>Patients were divided into two groups (A and B). The patients in the group A were treated with 1000 mg tid of hydrotalcite, 20 mg bid of rabeprazole, 1000 mg bid of amoxicillin and 500 mg bid of clarithromycin; The patients in group B were treated with colloidal bismuth pectin 300 mg bid + rabeprazole 20 mg bid + amoxicillin 1000 mg bid + clarithromycin 500 mg bid for 10 days. At least 28 days after the end of treatment, all patients received <sup>13</sup>C urea breath test to evaluate and compare the <italic>Hp</italic> eradication rate between two groups.</p>
</sec>
<sec id="s4_3">
<title>
<italic>Hp</italic> culture</title>
<p>Biopsy was inoculated onto Columbia blood agar plates supplemented with designated antibiotics. Inoculation was performed by direct contact of mucosa side and agar. The contact is gentle and even to ensure successful inoculation. Preservation media was applied to evenly cover the whole plate. The biopsy was removed and used in to confirm the presence of <italic>Hp</italic>. Agar plates were incubated in 5% O<sub>2</sub>, 10% CO<sub>2</sub>, 85% N<sub>2</sub> at 37 degree for 3 or 4 days.</p>
</sec>
<sec id="s4_4">
<title>Single colony inoculation and cryo-preservation</title>
<p>
<italic>Hp</italic> colony was validated with morphology (Gram negative) and biochemical assays. Single <italic>Hp</italic> colony was transferred to a new Columbia agar plate and inoculated evenly. After 3-4 days of culture in incubator with 5% O<sub>2</sub>, 10% CO<sub>2</sub>, 85% N<sub>2</sub> at 37 degree, <italic>Hp</italic> colonies were cryo-preserved in -80 degree for next generation sequencing.</p>
</sec>
<sec id="s4_5">
<title>Antibiotic test</title>
<p>Determination of antibiotic sensitivity was performed with disk diffusion test according to standardized Kirby-Bauer procedure. White paper disks containing antibiotics were arranged onto the agar plates. The size of circular zones of poor bacteria growth surrounding paper disks was measured and used to define antibiotic sensitivity using customized thresholds (<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Figure&#xa0;1</bold>
</xref>).</p>
</sec>
<sec id="s4_6">
<title>DNA extraction</title>
<p>DNA extraction was performed with Magen HiPure Bacterial DNA kits. Final DNA output was dissolved in 30 &#x3bc;l TE buffer and analyzed with Qubit (Thermofisher) to determine concentration.</p>
</sec>
<sec id="s4_7">
<title>Library construction and sequencing</title>
<p>10 ng DNA was used for library construction. DNA was fragmented with sonification to obtain fragments of 300 bp. Beads-based selection was performed to select DNA fragments after end repairing and adapter ligation. Library amplification was performed with Super Canace High Fidelity enzyme. Amplified libraries and size selected and purified. Agilent 2100 was used for library QC. The resulted libraries were normalized by molar concentration and sequenced with paired-end 150 bp mode on illumina platform.</p>
</sec>
<sec id="s4_8">
<title>Mutation calling</title>
<p>Our mutation calling process commenced with rigorous quality control measures aimed at eliminating adapters and low-quality reads, ensuring the generation of clean reads. These clean reads were then meticulously aligned to the Helicobacter pylori reference genome, specifically the Helicobacter pylori 26695 genome (accessible at <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/nuccore/AE000511">https://www.ncbi.nlm.nih.gov/nuccore/AE000511</ext-link>) using BWA (v0.7.17) with parameters &#x201c;mem -t 2 -M -Y&#x201d;. The resulting alignment data, in BAM format, was sorted and indexed with samtools (v1.9), which was the basis for mutation calling through the use of bcftools (v1.9) with parameters &#x201c;call -vmO z&#x201d;. To enhance the accuracy of our findings, only SNP sites demonstrating at least 2x coverage across all samples were retained for subsequent analysis. We performed &#x201c;bcftools filter -O v -s LOWQUAL -e &#x2018;\&#x2019;&#x2019;QUAL&lt;10 || FMT/DP &lt;5&#x2019;\&#x2019;&#x2019; &#x2013;SnpGap 5 &#x2013;set-GTs&#x201d; to filter out SNPs of low quality. The resulting SNPs were annotated with Annovar (v191024).</p>
</sec>
<sec id="s4_9">
<title>Identification of significant SNPs</title>
<p>The determination of significant SNPs was achieved via rigorous statistical assessments. Our analysis incorporated two independent statistical tests, namely the Chi-squared test and Fisher&#x2019;s exact test. Employing a stringent approach, only SNPs exhibiting <italic>p</italic>-values below 0.05 in both tests were considered significant and subsequently utilized in our downstream analytical endeavors.</p>
</sec>
<sec id="s4_10">
<title>Calculation of sensitivity and specificity</title>
<p>To gauge the efficacy of our approach for each antibiotic, we formulated confusion matrices specific to each significant SNP. The calculation of Sensitivity involved determining the ratio between true positives and model-predicted positives, while Specificity was calculated as the ratio between true negatives and model-predicted negatives. The confusion matrix is comprised of true positive (TP), false positive (FP), false negative (FN) and true negative (TN). To be precise, the formulars are &#x201c;sensitivity = TP/(TP+FN)&#x201d; and &#x201c;specificity = TN/(TN+FP)&#x201d;. These calculations were executed in the R programming environment.</p>
</sec>
<sec id="s4_11">
<title>Phylogenetic analysis</title>
<p>Phylogenetic trees were constructed using SNP data identified in sample subsets of varying sizes, encompassing 5, 10, 20, 30, 40, and 50 samples, yielding 56671, 22601, 18749, 13938, 10397, and 3470 SNPs, respectively. Furthermore, we also plotted phylogenetic trees using only the significant SNPs identified through the aforementioned statistical tests, providing a comprehensive visual representation of genetic variation. The brief step for phylogenetic analysis is as follows. The SNPs in VCF file were converted to FASTA format and imported to MEGA (v10.2), then maximum likelihood tree was constructed with default parameters. The resulting tree file (nwk fomat) was then imported to an online tool called iTOL (<ext-link ext-link-type="uri" xlink:href="https://itol.embl.de">https://itol.embl.de</ext-link>) for visualization.</p>
</sec>
<sec id="s4_12">
<title>Support vector machine</title>
<p>To train classifier to predict antibiotic sensitivity using SNP information, input data was prepared using significant SNP for antibiotic under investigation. To facilitate the SVM modeling process, SNP data was systematically converted into numeric values, serving as the input for our SVM model. Briefly, input data was a patient-SNP matrix consisting of 0 or 1. SNP value of &#x201c;1&#x201d; suggests a polymorphism (non-wild type status), while SNP value of &#x201c;0&#x201d; indicates same genotype as the reference strain.</p>
<p>For Amoxicillin antibiotic resistance, we had 39 sensitive strains, 9 resistant strains, 2 intermediate strains and 2 lowly-sensitive strains. For Clarithromycin, we had 27 sensitive strains, 23 resistant strains and 2 intermediate strains. As the label &#x201c;intermediate&#x201d; and &#x201c;lowly-sensitive&#x201d; had very few observations, we aimed to build the two class SVM classifier using only sensitive and resistant strains. As for Clarithromycine, we had 27 sensitive strains, 23 resistant strains and 2 intermediate strains. Only sensitive and resistant strains were used for SVM.</p>
<p>The implementation of Support Vector Machine (SVM) modeling was facilitated through the e1017 package in the R programming environment. Employing a &#x201c;radial&#x201d; kernel, with a cost set at &#x201c;1&#x201d; for optimal SVM performance, we ensured model reproducibility by utilizing set.seed before the SVM modeling process. Sensitivity and specificity metrics were calculated using the above mentioned formulars: &#x201c;sensitivity = TP/(TP+FN)&#x201d; and &#x201c;specificity = TN/(TN+FP)&#x201d;.</p>
<p>In the model validation process for the Support Vector Machine (SVM) analysis, two distinct validation procedures were implemented to ensure the robustness and reliability of the model. The first procedure involved partitioning the original dataset into two subsets: 60% of the data was used as the training set, where the SVM model was trained to understand the patterns and relationships in the data. The remaining 40% constituted the test set, which was utilized to evaluate the model&#x2019;s performance, specifically its ability to accurately predict outcomes on new, unseen data. This approach of splitting the dataset provides a straightforward way to check the model&#x2019;s efficacy and generalizability.</p>
<p>The second procedure employed was 5-fold cross-validation, a more rigorous validation technique. In this method, the dataset was divided into five equal parts. In each of the five iterations of the process, a different fold was used as the validation set, while the remaining four folds collectively served as the training set. This cycle ensured that each part of the dataset was used both for training and validation. Cross-validation is particularly valuable as it mitigates the risk of overfitting, ensuring the model&#x2019;s performance is not overly tailored to a specific subset of data. By averaging the results from all five folds, a more comprehensive and reliable assessment of the model&#x2019;s performance is obtained, enhancing confidence in its predictive accuracy. Together, these two validation procedures provide a thorough examination of the SVM model&#x2019;s capabilities, contributing to its credibility and applicability in practical scenarios.</p>
</sec>
</sec>
<sec id="s5" sec-type="data-availability">
<title>Data availability statement</title>
<p>All the raw Hp WGS data and SNP results were uploaded to the public repository zenodo (doi:<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.5281/zenodo.10369064">10.5281/zenodo.10369064</ext-link>), can be accessed via the url: <ext-link ext-link-type="uri" xlink:href="https://zenodo.org/records/10369064">https://zenodo.org/records/10369064</ext-link>. Further inquiries can be directed to the corresponding authors.</p>
</sec>
<sec id="s6" sec-type="ethics-statement">
<title>Ethics statement</title>
<p>The studies involving humans were approved by No.2017-74 ethical identification from the 7th Medical Center of PLA General Hospital. The studies were conducted in accordance with the local legislation and institutional requirements. Written informed consent for participation in this study was provided by the participants&#x2019; legal guardians/next of kin.</p>
</sec>
<sec id="s7" sec-type="author-contributions">
<title>Author contributions</title>
<p>JY: Data curation, Funding acquisition, Investigation, Project administration, Resources, Supervision, Writing &#x2013; original draft, Formal Analysis. YJ: Data curation, Formal Analysis, Investigation, Project administration, Resources, Supervision, Writing &#x2013; review &amp; editing, Conceptualization. QY: Data curation, Methodology, Software, Validation, Visualization, Writing &#x2013; original draft, Writing &#x2013; review &amp; editing. LL: Data curation, Investigation, Project administration, Resources, Writing &#x2013; review &amp; editing. CL: Conceptualization, Data curation, Investigation, Project administration, Resources, Writing &#x2013; review &amp; editing. BC: Methodology, Software, Supervision, Validation, Writing &#x2013; review &amp; editing. PZ: Data curation, Formal Analysis, Project administration, Writing &#x2013; review &amp; editing. XL: Conceptualization, Data curation, Formal Analysis, Investigation, Resources, Writing &#x2013; review &amp; editing. HL: Formal Analysis, Investigation, Methodology, Resources, Writing &#x2013; review &amp; editing. YS: Data curation, Formal Analysis, Resources, Validation, Writing &#x2013; review &amp; editing. XZ: Conceptualization, Data curation, Methodology, Writing &#x2013; review &amp; editing. YH: Data curation, Formal Analysis, Investigation, Methodology, Resources, Validation, Writing &#x2013; review &amp; editing.&#xa0;XH: Investigation, Methodology, Software, Supervision, Validation,&#xa0;Writing &#x2013; original draft, Writing &#x2013; review &amp; editing. SL:&#xa0;Conceptualization, Data curation, Funding acquisition, Investigation, Resources, Writing &#x2013; review &amp; editing. YP: Conceptualization, Methodology, Project administration, Resources, Supervision, Visualization, Writing &#x2013; original draft, Writing &#x2013; review &amp; editing.</p>
</sec>
</body>
<back>
<sec id="s8" sec-type="funding-information">
<title>Funding</title>
<p>The author(s) declare financial support was received for the research, authorship, and/or publication of this article. This study was supported by grants from Longyan City Science and Technology Plan Project (Grant number: 2022LYF17082) and Fujian Province Natural Science Foundation (Grant number: 2021J011439).</p>
</sec>
<sec id="s9" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s10" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s11" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fcimb.2023.1306368/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fcimb.2023.1306368/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="Table_1.xlsx" id="ST1" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet"/>
<supplementary-material xlink:href="Image_1.pdf" id="SM1" mimetype="application/pdf"/>
</sec>
<fn-group>
<title>Abbreviations</title>
<fn fn-type="abbr">
<p>AMR, Antimicrobial Resistance; AST, Antimicrobial susceptibility testing; NGS, Next-generation sequencing; <italic>Hp</italic>, <italic>Helicobacter pylori</italic>; GATK, Genomic Analysis Toolkit; SNP, Single-Nucleotide Polymorphism<bold>;</bold> SVM, Support Vector Machine; QC, Quality Control.</p>
</fn>
</fn-group>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Camorlinga-Ponce</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Gomez-Delgado</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Aguilar-Zamora</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Torres</surname> <given-names>R. C.</given-names>
</name>
<name>
<surname>Giono-Cerezo</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Escobar-Ogaz</surname> <given-names>A.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>Phenotypic and genotypic antibiotic resistance patterns in helicobacter pylori strains from ethnically diverse population in Mexico</article-title>. <source>Front. Cell Infect. Microbiol.</source> <volume>10</volume>, <elocation-id>539115</elocation-id>. doi: <pub-id pub-id-type="doi">10.3389/fcimb.2020.539115</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dutilh</surname> <given-names>B. E.</given-names>
</name>
<name>
<surname>Backus</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Edwards</surname> <given-names>R. A.</given-names>
</name>
<name>
<surname>Wels</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Bayjanov</surname> <given-names>J. R.</given-names>
</name>
<name>
<surname>van Hijum</surname> <given-names>S. A.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Explaining microbial phenotypes on a genomic scale: GWAS for microbes</article-title>. <source>Brief Funct. Genomics</source> <volume>12</volume> (<issue>4</issue>), <fpage>366</fpage>&#x2013;<lpage>380</lpage>. doi: <pub-id pub-id-type="doi">10.1093/bfgp/elt008</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gerrits</surname> <given-names>M. M.</given-names>
</name>
<name>
<surname>van Vliet</surname> <given-names>A. H.</given-names>
</name>
<name>
<surname>Kuipers</surname> <given-names>E. J.</given-names>
</name>
<name>
<surname>Kusters</surname> <given-names>J. G.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>Helicobacter pylori and antimicrobial resistance: molecular mechanisms and clinical implications</article-title>. <source>Lancet Infect. Dis.</source> <volume>6</volume> (<issue>11</issue>), <fpage>699</fpage>&#x2013;<lpage>709</lpage>. doi: <pub-id pub-id-type="doi">10.1016/S1473-3099(06)70627-2</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Iwamoto</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Tanahashi</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Okada</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Yoshida</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Kikuchi</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Keida</surname> <given-names>Y.</given-names>
</name>
<etal/>
</person-group>. (<year>2014</year>). <article-title>Whole-genome sequencing of clarithromycin resistant Helicobacter pylori characterizes unidentified variants of multidrug resistant efflux pump genes</article-title>. <source>Gut Pathog.</source> <volume>6</volume>, <fpage>27</fpage>. doi: <pub-id pub-id-type="doi">10.1186/1757-4749-6-27</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lauener</surname> <given-names>F. N.</given-names>
</name>
<name>
<surname>Imkamp</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Lehours</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Buissonniere</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Benejat</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Zbinden</surname> <given-names>R.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>Genetic determinants and prediction of antibiotic resistance phenotypes in helicobacter pylori</article-title>. <source>J. Clin. Med.</source> <volume>8</volume> (<issue>1</issue>), <page-range>1&#x2013;14</page-range>. doi: <pub-id pub-id-type="doi">10.3390/jcm8010053</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Deng</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Lu</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Sun</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Lv</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>S.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>Evaluation of machine learning models for predicting antimicrobial resistance of actinobacillus pleuropneumoniae from whole genome sequences</article-title>. <source>Front. Microbiol.</source> <volume>11</volume>, <elocation-id>48</elocation-id>. doi: <pub-id pub-id-type="doi">10.3389/fmicb.2020.00048</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Malla</surname> <given-names>M. A.</given-names>
</name>
<name>
<surname>Dubey</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Kumar</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Yadav</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Hashem</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Abd Allah</surname> <given-names>E. F.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Exploring the human microbiome: the potential future role of next-generation sequencing in disease diagnosis and treatment</article-title>. <source>Front. Immunol.</source> <volume>9</volume>, <elocation-id>2868</elocation-id>. doi: <pub-id pub-id-type="doi">10.3389/fimmu.2018.02868</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Moore</surname> <given-names>R. A.</given-names>
</name>
<name>
<surname>Beckthold</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Wong</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Kureishi</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Bryan</surname> <given-names>L. E.</given-names>
</name>
</person-group> (<year>1995</year>). <article-title>Nucleotide sequence of the gyrA gene and characterization of ciprofloxacin-resistant mutants of Helicobacter pylori</article-title>. <source>Antimicrob. Agents Chemother.</source> <volume>39</volume> (<issue>1</issue>), <fpage>107</fpage>&#x2013;<lpage>111</lpage>. doi: <pub-id pub-id-type="doi">10.1128/AAC.39.1.107</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mousavizadeh</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Ghasemi</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Genotype and phenotype of COVID-19: Their roles in pathogenesis</article-title>. <source>J. Microbiol. Immunol. Infect.</source> <volume>54</volume> (<issue>2</issue>), <fpage>159</fpage>&#x2013;<lpage>163</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.jmii.2020.03.022</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Oude Munnink</surname> <given-names>B. B.</given-names>
</name>
<name>
<surname>Nieuwenhuijse</surname> <given-names>D. F.</given-names>
</name>
<name>
<surname>Stein</surname> <given-names>M.</given-names>
</name>
<name>
<surname>O'Toole</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Haverkate</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Mollers</surname> <given-names>M.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>Rapid SARS-CoV-2 whole-genome sequencing and analysis for informed public health decision-making in the Netherlands</article-title>. <source>Nat. Med.</source> <volume>26</volume> (<issue>9</issue>), <fpage>1405</fpage>&#x2013;<lpage>1410</lpage>. doi: <pub-id pub-id-type="doi">10.1038/s41591-020-0997-y</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ren</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Chakraborty</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Doijad</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Falgenhauer</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Falgenhauer</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Goesmann</surname> <given-names>A.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>Prediction of antimicrobial resistance based on whole-genome sequencing and machine learning</article-title>. <source>Bioinformatics</source> <volume>38</volume> (<issue>2</issue>), <fpage>325</fpage>&#x2013;<lpage>334</lpage>. doi: <pub-id pub-id-type="doi">10.1093/bioinformatics/btab681</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Reygaert</surname> <given-names>W. C.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>An overview of the antimicrobial resistance mechanisms of bacteria</article-title>. <source>AIMS Microbiol.</source> <volume>4</volume> (<issue>3</issue>), <fpage>482</fpage>&#x2013;<lpage>501</lpage>. doi: <pub-id pub-id-type="doi">10.3934/microbiol.2018.3.482</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Salih</surname> <given-names>B. A.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Helicobacter pylori infection in developing countries: the burden for how long</article-title>? <source>Saudi J. Gastroenterol.</source> <volume>15</volume> (<issue>3</issue>), <fpage>201</fpage>&#x2013;<lpage>207</lpage>. doi: <pub-id pub-id-type="doi">10.4103/1319-3767.54743</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Smith</surname> <given-names>S. M.</given-names>
</name>
<name>
<surname>O'Morain</surname> <given-names>C.</given-names>
</name>
<name>
<surname>McNamara</surname> <given-names>D.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Antimicrobial susceptibility testing for Helicobacter pylori in times of increasing antibiotic resistance</article-title>. <source>World J. Gastroenterol.</source> <volume>20</volume> (<issue>29</issue>), <fpage>9912</fpage>&#x2013;<lpage>9921</lpage>. doi: <pub-id pub-id-type="doi">10.3748/wjg.v20.i29.9912</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Su</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Satola</surname> <given-names>S. W.</given-names>
</name>
<name>
<surname>Read</surname> <given-names>T. D.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Genome-based prediction of bacterial antibiotic resistance</article-title>. <source>J. Clin. Microbiol.</source> <volume>57</volume> (<issue>3</issue>), <page-range>1&#x2013;15</page-range>. doi: <pub-id pub-id-type="doi">10.1128/JCM.01405-18</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>van Opijnen</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Camilli</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>A fine scale phenotype-genotype virulence map of a bacterial pathogen</article-title>. <source>Genome Res.</source> <volume>22</volume> (<issue>12</issue>), <fpage>2541</fpage>&#x2013;<lpage>2551</lpage>. doi: <pub-id pub-id-type="doi">10.1101/gr.137430.112</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Versalovic</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Shortridge</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Kibler</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Griffy</surname> <given-names>M. V.</given-names>
</name>
<name>
<surname>Beyer</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Flamm</surname> <given-names>R. K.</given-names>
</name>
<etal/>
</person-group>. (<year>1996</year>). <article-title>Mutations in 23S rRNA are associated with clarithromycin resistance in Helicobacter pylori</article-title>. <source>Antimicrob. Agents Chemother.</source> <volume>40</volume> (<issue>2</issue>), <fpage>477</fpage>&#x2013;<lpage>480</lpage>. doi: <pub-id pub-id-type="doi">10.1128/AAC.40.2.477</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Guo</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Yuan</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Gong</surname> <given-names>Y.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>The antibiotic resistance of Helicobacter pylori to five antibiotics and influencing factors in an area of China with a high risk of gastric cancer</article-title>. <source>BMC Microbiol.</source> <volume>19</volume> (<issue>1</issue>), <fpage>152</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12866-019-1517-4</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Witney</surname> <given-names>A. A.</given-names>
</name>
<name>
<surname>Cosgrove</surname> <given-names>C. A.</given-names>
</name>
<name>
<surname>Arnold</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Hinds</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Stoker</surname> <given-names>N. G.</given-names>
</name>
<name>
<surname>Butcher</surname> <given-names>P. D.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Clinical use of whole genome sequencing for Mycobacterium tuberculosis</article-title>. <source>BMC Med.</source> <volume>14</volume>, <fpage>46</fpage>. doi: <pub-id pub-id-type="doi">10.1186/s12916-016-0598-2</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wroblewski</surname> <given-names>L. E.</given-names>
</name>
<name>
<surname>Peek</surname> <given-names>R. M.</given-names> <suffix>Jr.</suffix>
</name>
<name>
<surname>Wilson</surname> <given-names>K. T.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Helicobacter pylori and gastric cancer: factors that modulate disease risk</article-title>. <source>Clin. Microbiol. Rev.</source> <volume>23</volume> (<issue>4</issue>), <fpage>713</fpage>&#x2013;<lpage>739</lpage>. doi: <pub-id pub-id-type="doi">10.1128/CMR.00011-10</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Zhong</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Deng</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>X.</given-names>
</name>
<etal/>
</person-group>. (<year>2022</year>). <article-title>A survey of helicobacter pylori antibiotic-resistant genotypes and strain lineages by whole-genome sequencing in China</article-title>. <source>Antimicrob. Agents Chemother.</source> <volume>66</volume> (<issue>6</issue>), <elocation-id>e0218821</elocation-id>. doi: <pub-id pub-id-type="doi">10.1128/aac.02188-21</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>