<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Mol. Biosci.</journal-id>
<journal-title>Frontiers in Molecular Biosciences</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Mol. Biosci.</abbrev-journal-title>
<issn pub-type="epub">2296-889X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">737821</article-id>
<article-id pub-id-type="doi">10.3389/fmolb.2021.737821</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Molecular Biosciences</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Experimental and Meta-Analytic Validation of RNA Sequencing Signatures for Predicting Status of Microsatellite Instability</article-title>
<alt-title alt-title-type="left-running-head">Sorokin et&#x20;al.</alt-title>
<alt-title alt-title-type="right-running-head">RNAseq Signatures for MSI Prediction</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Sorokin</surname>
<given-names>Maksim</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/500181/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Rabushko</surname>
<given-names>Elizaveta</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1232137/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Efimov</surname>
<given-names>Victor</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
<xref ref-type="aff" rid="aff6">
<sup>6</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1399476/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Poddubskaya</surname>
<given-names>Elena</given-names>
</name>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/814498/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Sekacheva</surname>
<given-names>Marina</given-names>
</name>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1006054/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Simonov</surname>
<given-names>Alexander</given-names>
</name>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
<xref ref-type="aff" rid="aff6">
<sup>6</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/658527/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Nikitin</surname>
<given-names>Daniil</given-names>
</name>
<xref ref-type="aff" rid="aff6">
<sup>6</sup>
</xref>
<xref ref-type="aff" rid="aff7">
<sup>7</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Drobyshev</surname>
<given-names>Aleksey</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Suntsova</surname>
<given-names>Maria</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1245497/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Buzdin</surname>
<given-names>Anton</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
<xref ref-type="aff" rid="aff7">
<sup>7</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/64369/overview"/>
</contrib>
</contrib-group>
<aff id="aff1">
<label>
<sup>1</sup>
</label>Laboratory For Clinical and Genomic Bioinformatics, I.M. Sechenov First Moscow State Medical University, <addr-line>Moscow</addr-line>, <country>Russia</country>
</aff>
<aff id="aff2">
<label>
<sup>2</sup>
</label>Moscow Institute of Physics and Technology, <addr-line>Dolgoprudny</addr-line>, <country>Russia</country>
</aff>
<aff id="aff3">
<label>
<sup>3</sup>
</label>OmicsWay Corp., <addr-line>Walnut</addr-line>, <addr-line>CA</addr-line>, <country>United&#x20;States</country>
</aff>
<aff id="aff4">
<label>
<sup>4</sup>
</label>Faculty of Biology, Lomonosov Moscow State University, <addr-line>Moscow</addr-line>, <country>Russia</country>
</aff>
<aff id="aff5">
<label>
<sup>5</sup>
</label>World-Class Research Center &#x201c;Digital Biodesign and Personalized Healthcare&#x201d;, Sechenov First Moscow State Medical University, <addr-line>Moscow</addr-line>, <country>Russia</country>
</aff>
<aff id="aff6">
<label>
<sup>6</sup>
</label>Oncobox Ltd., <addr-line>Moscow</addr-line>, <country>Russia</country>
</aff>
<aff id="aff7">
<label>
<sup>7</sup>
</label>Shemyakin-Ovchinnikov Institute of Bioorganic Chemistry, <addr-line>Moscow</addr-line>, <country>Russia</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/21528/overview">William C. Cho</ext-link>, QEH, Hong Kong, SAR China</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/580342/overview">Xiaosheng Wang</ext-link>, China Pharmaceutical University, China</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1317234/overview">Ximing Xu</ext-link>, Renmin Hospital of Wuhan University, China</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Maksim Sorokin, <email>sorokin@oncobox.com</email>
</corresp>
<fn fn-type="other">
<p>This article was submitted to Molecular Diagnostics and Therapeutics, a section of the journal Frontiers in Molecular Biosciences</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>23</day>
<month>11</month>
<year>2021</year>
</pub-date>
<pub-date pub-type="collection">
<year>2021</year>
</pub-date>
<volume>8</volume>
<elocation-id>737821</elocation-id>
<history>
<date date-type="received">
<day>07</day>
<month>07</month>
<year>2021</year>
</date>
<date date-type="accepted">
<day>19</day>
<month>10</month>
<year>2021</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2021 Sorokin, Rabushko, Efimov, Poddubskaya, Sekacheva, Simonov, Nikitin, Drobyshev, Suntsova and Buzdin.</copyright-statement>
<copyright-year>2021</copyright-year>
<copyright-holder>Sorokin, Rabushko, Efimov, Poddubskaya, Sekacheva, Simonov, Nikitin, Drobyshev, Suntsova and Buzdin</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these&#x20;terms.</p>
</license>
</permissions>
<abstract>
<p>Microsatellite instability (MSI) is an important diagnostic and prognostic cancer biomarker. In colorectal, cervical, ovarian, and gastric cancers, it can guide the prescription of chemotherapy and immunotherapy. In laboratory diagnostics of susceptible tumors, MSI is routinely detected by the size of marker polymerase chain reaction products encompassing frequent microsatellite expansion regions. Alternatively, MSI status is screened indirectly by immunohistochemical interrogation of microsatellite binding proteins. RNA sequencing (RNAseq) profiling is an emerging source of data for a wide spectrum of cancer biomarkers. Recently, three RNAseq-based gene signatures were deduced for establishing MSI status in tumor samples. They had 25, 15, and 14 gene products with only one common gene. However, they were developed and tested on the incomplete literature of The Cancer Genome Atlas (TCGA) sampling and never validated experimentally on independent RNAseq samples. In this study, we, for the first time, systematically validated these three RNAseq MSI signatures on the literature colorectal cancer (CRC) (<italic>n</italic>&#x20;&#x3d; 619), endometrial carcinoma (<italic>n</italic>&#x20;&#x3d; 533), gastric cancer (<italic>n</italic>&#x20;&#x3d; 380), uterine carcinosarcoma (<italic>n</italic>&#x20;&#x3d; 55), and esophageal cancer (<italic>n</italic>&#x20;&#x3d; 83) samples and on the set of experimental CRC RNAseq samples (<italic>n</italic>&#x20;&#x3d; 23) for tumors with known MSI status. We found that all three signatures performed well with area under the curve (AUC) ranges of 0.94&#x2013;1 for the experimental CRCs and 0.94&#x2013;1 for the TCGA CRC, esophageal cancer, and uterine carcinosarcoma samples. However, for the TCGA endometrial carcinoma and gastric cancer samples, only two signatures were effective with AUC 0.91&#x2013;0.97, whereas the third signature showed a significantly lower AUC of 0.69&#x2013;0.88. Software for calculating these MSI signatures using RNAseq data is included.</p>
</abstract>
<kwd-group>
<kwd>microsatellite instability</kwd>
<kwd>RNA sequencing</kwd>
<kwd>NGS</kwd>
<kwd>RNAseq</kwd>
<kwd>gene signatures</kwd>
<kwd>experimental validation</kwd>
</kwd-group>
</article-meta>
</front>
<body>
<sec id="s1">
<title>Introduction</title>
<p>Microsatellite instability (MSI) results from and is a marker of defective DNA mismatch repair (dMMR). Tumors accumulate multiple mutations across the genome (<xref ref-type="bibr" rid="B34">Ryan et&#x20;al., 2017</xref>). Short tandem repeats are particularly frequent targets to mismatch errors, and dMMR-linked mutations are prone to be present in microsatellite regions (tandem repeats of up to six nucleotides short stretches of DNA) (<xref ref-type="bibr" rid="B19">Johansen et&#x20;al., 2019</xref>). Detectable expansion or shrinkage of microsatellite repeats is referred to as MSI (<xref ref-type="bibr" rid="B29">Marcus et&#x20;al., 2019</xref>).</p>
<p>MSI was the second clinically approved predictive biomarker for the PD1-specific immunotherapy in adult and pediatric advanced cancer patients. In 2017, the approval of the PD1-specific checkpoint inhibitor antibody pembrolizumab for patients with high MSI was based on the evidence of clinical efficacy from five clinical trials (<xref ref-type="bibr" rid="B29">Marcus et&#x20;al., 2019</xref>). This was the first time when a cancer drug was approved based on a general, not a tumor type-specific biomarker.</p>
<p>Tumors with dMMR also have more mutations in non-microsatellite DNA and thus have more neoantigens. For example, an average figure of &#x223c;1,800 mutations and &#x223c;580 neoantigens was detected in colorectal cancers (CRCs) with dMMR compared with only &#x223c;70 mutations and &#x223c;20 predicted neoantigens in CRCs with normal MMR (<xref ref-type="bibr" rid="B23">Le et&#x20;al., 2015</xref>). An increased amount of neoantigens in dMMR tumors promotes tumor infiltration by lymphocytes (<xref ref-type="bibr" rid="B14">Dudley et&#x20;al., 2016</xref>; <xref ref-type="bibr" rid="B16">Giannakis et&#x20;al., 2016</xref>), which may cause a more effective response to immunotherapy (<xref ref-type="bibr" rid="B27">Luchini et&#x20;al., 2019</xref>). This provides a theoretical basis for MSI/dMMR biomarker effectiveness for the treatment response to immune checkpoint inhibitors targeting PD-1, PD-L1, and CTLA-4 proteins (<xref ref-type="bibr" rid="B23">Le et&#x20;al., 2015</xref>).</p>
<p>The Food and Drug Administration did not specify which assay should be used to measure MSI. Currently, there are three basic options available for determining MSI status in clinical practice: immunohistochemistry (IHC) for testing dMMR, polymerase chain reaction (PCR), and genomic/exome/panel sequencing for detecting MSI (<xref ref-type="bibr" rid="B34">Ryan et&#x20;al., 2017</xref>; <xref ref-type="bibr" rid="B2">Baretti and Le, 2018</xref>; <xref ref-type="bibr" rid="B47">Waalkes et&#x20;al., 2018</xref>).</p>
<p>IHC test interrogates expressions of four proteins: MLH1, MSH2, MSH6, and PMS2. dMMR is diagnosed when there is detected loss of expression of one or more such proteins (<xref ref-type="bibr" rid="B12">Danaher et&#x20;al., 2019</xref>). IHC tests for dMMR/MSI is simple and cost-effective, but it has a downside of relatively low analytic accuracy due to technical inconsistencies such as tissue fixation issues (<xref ref-type="bibr" rid="B15">Engel and Moore, 2011</xref>) and biological reasons such as missense mutations in MMR genes that can functionally inactivate protein without altering its IHC-tested expression level (<xref ref-type="bibr" rid="B36">Shia, 2008</xref>).</p>
<p>Alternatively, several PCR MSI panels have been designed, and two are most frequently used in practice: (1) two mononucleotide (<italic>BAT-25</italic> and <italic>BAT-26</italic>) and three dinucleotide (<italic>D5S346</italic>, <italic>D2S123</italic>, and <italic>D17S250</italic>) repeat panel (<xref ref-type="bibr" rid="B3">Boland et&#x20;al., 1998</xref>) and (2) five poly-A mononucleotide (<italic>BAT-25</italic>, <italic>BAT-26</italic>, <italic>NR-21</italic>, <italic>NR-24</italic>, and <italic>NR-27</italic>) repeat panel. The latter has greater sensitivity and specificity compared with the (1) panel (<xref ref-type="bibr" rid="B42">Suraweera et&#x20;al., 2002</xref>). Moreover, unlike (1), panel (2) has no requirement of having both tumors and paired healthy tissue for the test (<xref ref-type="bibr" rid="B35">Shemirani et&#x20;al., 2011</xref>). If at least two biomarkers in either panel lose stability, the tumor is diagnosed as MSI-positive.</p>
<p>As PCR testing is based on a limited number of specific microsatellite sites, this approach cannot capture full microsatellite profiles and thus cannot detect &#x223c;0.3&#x2013;10% of MSI cases (16). Furthermore, MSI prevalence and type are markedly different across the different cancer types. For example, lung, breast, and prostate cancers have only &#x223c;1&#x2013;2% MSI incidence (<xref ref-type="bibr" rid="B27">Luchini et&#x20;al., 2019</xref>; <xref ref-type="bibr" rid="B29">Marcus et&#x20;al., 2019</xref>). This proportion is higher for gastric, ovarian, and cervical cancers and is maximal for CRC. These observations are reflected in specific diagnostic guidelines, and MSI testing is not routinely recommended for most tumor types. These factors limit the use of the PCR MSI test on a broad scale (<xref ref-type="bibr" rid="B48">Wang et&#x20;al., 2021</xref>).</p>
<p>DNA sequencing tests use either whole-exome sequencing (WES) or cancer gene panels. For targeted gene panels, the number of genes varies from around 200 to &#x3e;5,000 genes (<xref ref-type="bibr" rid="B47">Waalkes et&#x20;al., 2018</xref>). Thus, the analytic sites for testing MSI are strongly different among the different targeted panels, whereas the WES approach can provide more objective data, as evidenced by &#x223c;100% agreement with gold standard IHC and PCR MSI testing methods for 130 CRC patients when using the MSI sensor method (<xref ref-type="bibr" rid="B19">Johansen et&#x20;al., 2019</xref>).</p>
<p>As opposed to IHC- or PCR-based MSI testing, which are most suitable for CRC and other cancers belonging to the spectrum of Lynch syndrome, the sequencing MSI approach can be used for more tumor types. It can provide an advantage of combining MSI analysis with mutation screening and tumor mutation burden analysis (<xref ref-type="bibr" rid="B48">Wang et&#x20;al., 2021</xref>). However, genomic deep sequencing-based testing has major challenges of high cost and lack of wide availability (<xref ref-type="bibr" rid="B47">Waalkes et&#x20;al., 2018</xref>).</p>
<p>On the other hand, RNA sequencing (RNAseq) can provide another type of data for MSI assessment. In turn, the RNAseq approach has several serious advantages that make it another candidate for an emerging method of choice for MSI testing. RNAseq is a well-established technology for tumor specimens, including formalin-fixed, paraffin-embedded (FFPE) tissue samples (<xref ref-type="bibr" rid="B9">Buzdin et&#x20;al., 2020</xref>). Typically, one RNAseq analysis is less expensive than for WES or panel genomic sequencing (<xref ref-type="bibr" rid="B6">Bossel Ben-Moshe et&#x20;al., 2018</xref>). It can be informative for the assessment of IHC biomarkers (<xref ref-type="bibr" rid="B39">Sorokin et&#x20;al., 2020c</xref>; <xref ref-type="bibr" rid="B38">2020b</xref>), expression of cancer drug target genes (<xref ref-type="bibr" rid="B9">Buzdin et&#x20;al., 2020</xref>; <xref ref-type="bibr" rid="B40">Sorokin et&#x20;al., 2020d</xref>), tumor-specific molecular pathway activation (<xref ref-type="bibr" rid="B10">Buzdin et&#x20;al., 2018</xref>; <xref ref-type="bibr" rid="B4">Borisov et&#x20;al., 2020a</xref>), for personalized modeling of tumor drug response (<xref ref-type="bibr" rid="B21">Kim et&#x20;al., 2020</xref>; <xref ref-type="bibr" rid="B45">Tkachev et&#x20;al., 2020</xref>), and even for tumor mutation burden assessment (<xref ref-type="bibr" rid="B13">DiGuardo et&#x20;al., 2021</xref>). Furthermore, RNAseq data that inform on total gene expression profiles can also be applicable for generating MSI gene signatures. Three such signatures were recently developed (<xref ref-type="bibr" rid="B12">Danaher et&#x20;al., 2019</xref>; <xref ref-type="bibr" rid="B31">Pa&#x10d;&#xed;nkov&#xe1; and Popovici, 2019</xref>; <xref ref-type="bibr" rid="B24">Li et&#x20;al., 2020</xref>) based on TCGA project (<xref ref-type="bibr" rid="B46">Tomczak et&#x20;al., 2015</xref>) publicly available RNAseq data for CRC samples annotated with MSI status by gold standard IHC and/or PCR methods. A signature established by <xref ref-type="bibr" rid="B24">Li et&#x20;al. (2020)</xref> includes 25 genes, a signature by <xref ref-type="bibr" rid="B31">Pa&#x10d;&#xed;nkov&#xe1; and Popovici (2019)</xref> includes 15 genes, and a double signature by <xref ref-type="bibr" rid="B12">Danaher et&#x20;al. (2019)</xref>&#x2014;14 genes. Interestingly, those signatures are mostly different by gene content and have only one common gene (<xref ref-type="fig" rid="F1">Figure&#x20;1</xref>).</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Overlap between gene composition of MSI expression signatures developed by <xref ref-type="bibr" rid="B24">Li et&#x20;al. (2020)</xref>, <xref ref-type="bibr" rid="B31">Pa&#x10d;&#xed;nkov&#xe1; and Popovici (2019)</xref>, and <xref ref-type="bibr" rid="B12">Danaher et&#x20;al. (2019)</xref>.</p>
</caption>
<graphic xlink:href="fmolb-08-737821-g001.tif"/>
</fig>
<p>However, these signatures were developed and validated on the same TCGA samplings and were never validated experimentally on independent RNAseq profiles. In this study, we, for the first time, systematically validated these three RNAseq MSI signatures on the literature CRC (<italic>n</italic>&#x20;&#x3d; 619), endometrial carcinoma (<italic>n</italic>&#x20;&#x3d; 533), gastric cancer (<italic>n</italic>&#x20;&#x3d; 380), uterine carcinosarcoma (<italic>n</italic>&#x20;&#x3d; 55), and esophageal cancer (<italic>n</italic>&#x20;&#x3d; 83) samples and on the set of experimental CRC RNAseq samples (<italic>n</italic>&#x20;&#x3d; 23) for the tumors with known MSI status. As the gold experimental standard, we used seven PCR MSI biomarkers.</p>
<p>We found that all three signatures performed well with area under the curve (AUC) ranges of 0.94&#x2013;1 for the experimental CRCs and 0.94&#x2013;1 for the TCGA CRC, esophageal cancer, and uterine carcinosarcoma samples. However, for the TCGA endometrial carcinoma and gastric cancer samples, only two signatures were effective with AUC 0.91&#x2013;0.97, whereas the third signature showed a significantly lower AUC of 0.69&#x2013;0.88. Finally, we provide software for calculating these MSI signatures using RNAseq&#x20;data.</p>
</sec>
<sec sec-type="results" id="s2">
<title>Results</title>
<sec id="s2-1">
<title>Microsatellite Instability Data Curation and Analysis</title>
<p>For the literature (TCGA) dataset, we extracted MSI statuses for 1,670 available RNAseq samples from the Broad Firehose webpage. These MSI statuses obtained using IHC or PCR profiling were then considered as the gold standards for the assessment of transcriptomic signatures. As only MSI-high tumors are considered for specific therapeutic options, we pooled MSI-low and MSS (microsatellite stable) samples in a single class for further analyses. Totally, we obtained 1,340 MSI-low/MSS and 330&#x20;MSI-high profiles. These samples represented CRC, endometrial carcinoma, gastric cancer, uterine cancer, and esophageal cancer (<xref ref-type="table" rid="T1">Table&#x20;1</xref>). This was higher than the samplings used previously to validate <italic>Li</italic>, <italic>Pacinkova and Popovici</italic>, and <italic>Danaher</italic> signatures in the original studies (a total of 1,302, 626, and 689 samples, respectively; <xref ref-type="table" rid="T1">Table&#x20;1</xref>). We checked RNAseq gene signatures in binary classifier&#x20;mode.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Characteristic of literature and experimental cancer patient groups.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Validation set</th>
<th align="center">MSI-high</th>
<th align="center">MSI-low/MSS</th>
<th align="center">Total</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td colspan="4" align="left">Colorectal cancer (CRC)</td>
</tr>
<tr>
<td align="left">Current experimental</td>
<td align="center">6</td>
<td align="center">17</td>
<td align="center">23</td>
</tr>
<tr>
<td align="left">Current TCGA</td>
<td align="center">85</td>
<td align="center">534</td>
<td align="center">619</td>
</tr>
<tr>
<td align="left">Li TCGA</td>
<td align="center">55</td>
<td align="center">320</td>
<td align="center">375</td>
</tr>
<tr>
<td align="left">Pacinkova and Popovici TCGA</td>
<td align="center">35</td>
<td align="center">140</td>
<td align="center">175</td>
</tr>
<tr>
<td align="left">Danaher TCGA</td>
<td align="center">27</td>
<td align="center">126</td>
<td align="center">153</td>
</tr>
<tr>
<td colspan="4" align="left">Endometrial cancer (UCEC)</td>
</tr>
<tr>
<td align="left">&#x2003;Current TCGA</td>
<td align="center">170</td>
<td align="center">363</td>
<td align="center">533</td>
</tr>
<tr>
<td align="left">&#x2003;Li TCGA</td>
<td align="center">123</td>
<td align="center">244</td>
<td align="center">367</td>
</tr>
<tr>
<td align="left">&#x2003;Pacinkova and Popovici TCGA</td>
<td align="center">52</td>
<td align="center">64</td>
<td align="center">116</td>
</tr>
<tr>
<td align="left">&#x2003;Danaher TCGA</td>
<td align="center">71</td>
<td align="center">176</td>
<td align="center">247</td>
</tr>
<tr>
<td colspan="4" align="left">Gastric cancer (STAD)</td>
</tr>
<tr>
<td align="left">&#x2003;Current TCGA</td>
<td align="center">71</td>
<td align="center">309</td>
<td align="center">380</td>
</tr>
<tr>
<td align="left">&#x2003;Li TCGA</td>
<td align="center">80</td>
<td align="center">335</td>
<td align="center">415</td>
</tr>
<tr>
<td align="left">&#x2003;Pacinkova and Popovici TCGA</td>
<td align="center">54</td>
<td align="center">281</td>
<td align="center">335</td>
</tr>
<tr>
<td align="left">&#x2003;Danaher TCGA</td>
<td align="center">64</td>
<td align="center">225</td>
<td align="center">289</td>
</tr>
<tr>
<td colspan="4" align="left">Uterine carcinosarcoma (UCS)</td>
</tr>
<tr>
<td align="left">&#x2003;Current TCGA</td>
<td align="center">2</td>
<td align="center">53</td>
<td align="center">55</td>
</tr>
<tr>
<td align="left">&#x2003;Li TCGA</td>
<td align="center">2</td>
<td align="center">87</td>
<td align="center">89</td>
</tr>
<tr>
<td align="left">&#x2003;Pacinkova and Popovici TCGA</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
</tr>
<tr>
<td align="left">&#x2003;Danaher TCGA</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
</tr>
<tr>
<td colspan="4" align="left">Esophageal cancer (ESCA)</td>
</tr>
<tr>
<td align="left">&#x2003;Current TCGA</td>
<td align="center">2</td>
<td align="center">81</td>
<td align="center">83</td>
</tr>
<tr>
<td align="left">&#x2003;Li TCGA</td>
<td align="center">2</td>
<td align="center">54</td>
<td align="center">56</td>
</tr>
<tr>
<td align="left">&#x2003;Pacinkova and Popovici TCGA</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
</tr>
<tr>
<td align="left">&#x2003;Danaher TCGA</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
<td align="center">&#x2014;</td>
</tr>
<tr>
<td colspan="4" align="left">Control</td>
</tr>
<tr>
<td align="left">&#x2003;Current experimental</td>
<td align="center">1</td>
<td align="center">12</td>
<td align="center">13</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>For the experimental group, we profiled gene expression by RNAseq using FFPE tumor tissue blocks for a total of 23 CRC patients. In addition, we also analyzed a control group of 13&#x20;non-CRC tumor blocks to assess MSI signature performance on these samples as well. Among them, five patients had cervical cancer, two had breast cancer, two had gastric cancer, two had glioblastoma, one had ovarian cancer, and one had endometrial carcinosarcoma (<xref ref-type="sec" rid="s11">Supplementary Table S1</xref>). In total, the experimental group (<italic>n</italic>&#x20;&#x3d; 36) represented 27 female and nine male patients. The patient age varied from 31 to 84&#xa0;years; the mean patient age in the experimental group was 60.36&#xa0;years. More detailed patient information is given in <xref ref-type="sec" rid="s11">Supplementary Table&#x20;S1</xref>.</p>
<p>We performed RNAseq for each tumor sample and obtained &#x223c;3.75&#x2013;78.02 million reads uniquely mapped on known human Ensembl genes (genome version GRCh38 and transcriptome annotation GRCh38.89), on the average &#x223c;15.5 million gene-mapped reads per library.</p>
<p>For these samples, &#x201c;gold standard&#x201d; MSI statuses were determined by PCR test for seven marker microsatellite loci: BAT25, BAT26, BAT40, NR21, NR24, NR27, and CAT25 that are included in a routinely used clinical panel that requires no healthy tissue control (<xref ref-type="bibr" rid="B42">Suraweera et&#x20;al., 2002</xref>). When there were &#x2265;2 marker loci with detected unstable microsatellite length, these samples were considered MSI-high. Otherwise, the samples were put to the common MSI-low/MSS group. In the experimental group, there were a total of seven MSI-high and 29 MSI-low/MSS samples (<xref ref-type="table" rid="T1">Table&#x20;1</xref>, <xref ref-type="sec" rid="s11">Supplementary Table&#x20;S2</xref>).</p>
</sec>
<sec id="s2-2">
<title>Performance of Microsatellite Instability RNAseq Gene Signatures</title>
<p>By performing PubMed and Google Scholar literature search with keywords &#x201c;gene signature,&#x201d; &#x201c;gene expression,&#x201d; &#x201c;RNA sequencing,&#x201d; &#x201c;microsatellite instability,&#x201d;and &#x201c;MSI&#x201d; in March 2021, we extracted 73 hits that were manually processed and returned three recent original publications. These three unrelated research papers authored by <xref ref-type="bibr" rid="B24">Li et&#x20;al. (2020)</xref>, <xref ref-type="bibr" rid="B31">Pa&#x10d;&#xed;nkov&#xe1; and Popovici (2019)</xref>, and <xref ref-type="bibr" rid="B12">Danaher et&#x20;al. (2019)</xref> communicated different gene signatures of MSI status. All these signatures were deduced and initially validated on TCGA CRC samples available at the date of research (<xref ref-type="table" rid="T1">Table&#x20;1</xref>). For all the signatures identified, the initial bioinformatic validation cohorts were smaller than those extracted from TCGA in the current study (<xref ref-type="table" rid="T1">Table&#x20;1</xref>).</p>
<p>The signatures included 15 genes (Li), 25 genes (Pacincova and Popovici), and 14 genes (Danaher) (<xref ref-type="fig" rid="F1">Figure&#x20;1</xref>). We compared gene compositions of different signatures and found that they were largely different and shared only one common gene, <italic>MLH1</italic>, which encodes for mutL homolog 1 that can heterodimerize with mismatch repair endonuclease PMS2 to form MutL alpha, part of the DNA mismatch repair system (<xref ref-type="fig" rid="F1">Figure&#x20;1</xref>). Li signature shared four other genes with Danaher signature: <italic>EPM2AIP1, RNLS, SMAP1</italic>, and <italic>TTC30A</italic>. These genes encode for EPM2A interacting protein 1, renalase, small ArfGAP 1, and tetratricopeptide repeat domain 30A, respectively. Pacincova and Popovici signature also had two other common genes with Li signature: <italic>RPL22L1</italic> and <italic>SHROOM4</italic> encode for ribosomal protein L22 like 1 and shroom family member 4, respectively. Pacincova and Popovici signature had no other common genes with the Danaher signature (<xref ref-type="fig" rid="F1">Figure&#x20;1</xref>).</p>
<p>The experimental and literature samples were then used to assess the performances of those three signatures. All signature values were calculated as described in the original papers. We created and made publicly available the code for signature calculation at Gitlab: <ext-link ext-link-type="uri" xlink:href="https://gitlab.com/ef.viktor/msi_signatures">https://gitlab.com/ef.viktor/msi_signatures</ext-link>.</p>
<p>The signatures were validated using TCGA RNAseq datasets for tumor samples annotated by MSI status: CRC (<italic>n</italic>&#x20;&#x3d; 619), endometrial carcinoma (<italic>n</italic>&#x20;&#x3d; 533), gastric cancer (<italic>n</italic>&#x20;&#x3d; 380), uterine carcinosarcoma (<italic>n</italic>&#x20;&#x3d; 55), and esophageal cancer (<italic>n</italic>&#x20;&#x3d; 83) datasets and on the set of experimental CRC RNAseq samples (<italic>n</italic>&#x20;&#x3d; 23) and control experimental dataset for non-CRC cancer samples (<italic>n</italic>&#x20;&#x3d; 13). To assess signature biomarker quality, we used area under the ROC curve (ROC AUC) value as the measure. AUC reflects biomarker robustness and depends on its sensitivity and specificity (<xref ref-type="bibr" rid="B5">Borisov et&#x20;al., 2020b</xref>). It varies between 0.5 and 1, and the typical discrimination threshold is 0.7, where greater values denote high-quality biomarkers and <italic>vice versa</italic> (<xref ref-type="bibr" rid="B7">Boyd, 1997</xref>). AUC is often used for scoring different types of molecular biomarkers in oncology (<xref ref-type="bibr" rid="B26">Liu et&#x20;al., 2018</xref>; <xref ref-type="bibr" rid="B44">Tanioka et&#x20;al., 2018</xref>; <xref ref-type="bibr" rid="B11">Chen et&#x20;al., 2019</xref>; <xref ref-type="bibr" rid="B37">Sorokin et&#x20;al., 2020a</xref>). AUC and 95% confidence intervals were calculated using DeLong&#x2019;s method implemented in pROC R-package. The entire experimental dataset contained different cancer types; therefore, AUC was calculated only for the CRC subgroup of the experimental samples.</p>
<p>In our analysis, <italic>Li</italic> MSI signature (<xref ref-type="fig" rid="F2">Figure&#x20;2A</xref>) scored AUC &#x3d; 1.0 for the experimental CRC dataset, AUC &#x3d; 0.9462 for the TCGA CRC, AUC &#x3d; 0.9397 for the TCGA uterine corpus endometrial carcinoma (UCEC), AUC &#x3d; 0.9664 for the TCGA STAD dataset, and AUC &#x3d; 0.9981 for the TCGA joint dataset of UCS &#x2b; ESCA samples. <italic>Pacincova and Popovici</italic> signature (<xref ref-type="fig" rid="F2">Figure&#x20;2B</xref>) performed as high as AUC &#x3d; 0.9412 for the experimental CRC dataset, AUC &#x3d; 0.9583 for the TCGA CRC dataset, AUC &#x3d; 0.6946 for the TCGA UCEC, AUC &#x3d; 0.8827 for the TCGA STAD dataset, and AUC &#x3d; 0.9515 for the TCGA joint dataset of UCS &#x2b; ESCA samples. In turn, <italic>Danaher</italic> signature (<xref ref-type="fig" rid="F2">Figure&#x20;2C</xref>) showed AUC &#x3d; 0.9902 for the experimental CRC dataset, AUC &#x3d; 0.9396 for the TCGA CRC dataset, AUC &#x3d; 0.9442 for the TCGA UCEC, AUC &#x3d; 0.9589 for the TCGA STAD dataset, and AUC &#x3d; 1 for the TCGA joint dataset of UCS &#x2b; ESCA samples dataset.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Performance test of MSI RNAseq gene signatures. All signatures were tested for assessment of MSI status on CRC experimental dataset, non-CRC experimental dataset, TCGA CRC dataset, TCGA UCEC dataset, TCGA STAD dataset, and joint TCGA UCS &#x2b; ESCA dataset. Results for <xref ref-type="bibr" rid="B24">Li et&#x20;al. (2020)</xref> <bold>(A)</bold>, <xref ref-type="bibr" rid="B31">Pa&#x10d;&#xed;nkov&#xe1; and Popovici (2019)</xref> <bold>(B)</bold>, and <xref ref-type="bibr" rid="B12">Danaher et&#x20;al. (2019)</xref> <bold>(C)</bold> gene signatures are&#x20;shown.</p>
</caption>
<graphic xlink:href="fmolb-08-737821-g002.tif"/>
</fig>
<p>Similar to variations in AUC metrics for the three signatures tested, their extents related differently to the true-positive or true-negative MSI statuses (<xref ref-type="fig" rid="F3">Figures 3A&#x2013;C</xref>).</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Distribution of scores for MSI RNAseq gene signatures. X-axis shows MSI signature score, Y-axis&#x2014;number of samples. All signatures were tested for assessment of MSI status on CRC experimental dataset, experimental non-CRC (control) dataset, TCGA CRC dataset, TCGA UCEC dataset, TCGA STAD dataset, and joint TCGA UCS &#x2b; ESCA dataset. Results for <xref ref-type="bibr" rid="B24">Li et&#x20;al. (2020)</xref> <bold>(A)</bold>, <xref ref-type="bibr" rid="B31">Pa&#x10d;&#xed;nkov&#xe1; and Popovici (2019)</xref> <bold>(B)</bold>, and <xref ref-type="bibr" rid="B12">Danaher et&#x20;al. (2019)</xref> <bold>(C)</bold> gene signatures are&#x20;shown.</p>
</caption>
<graphic xlink:href="fmolb-08-737821-g003.tif"/>
</fig>
<p>In the experimental CRC group, there were 6&#x20;MSI-high and 17&#x20;MSI-low samples. However, in the experimental control group that included non-CRC cancers, there was only one MSI-high sample for endometrial carcinosarcoma, whereas all other samples were MSI-low (<xref ref-type="sec" rid="s11">Supplementary Table S2</xref>). All three signatures supported the true MSI status of samples in the control group (<xref ref-type="fig" rid="F3">Figures 3A&#x2013;C</xref>).</p>
<p>Assessment of MSI signatures is summarized in <xref ref-type="table" rid="T2">Table&#x20;2</xref>. It can be seen that <italic>Li</italic> signature showed the highest AUC in the experimental CRC group, followed by <italic>Danaher</italic> and <italic>Pacincova and Popovici</italic> signatures, respectively (<xref ref-type="table" rid="T2">Table&#x20;2</xref>). Also, all three signatures performed accurately on TCGA CRC, esophageal cancer, and uterine carcinosarcoma samples with AUC 0.94-1 and highly overlapping 95% confidence intervals. However, in the endometrial carcinoma (UCEC) cohort of TCGA data, <italic>Pacincova and Popovici</italic> signature showed low AUC below 0.7 threshold, whereas two other signatures showed AUC of at least 0.94. The latter also showed lower performance for TCGA gastric cancer samples (AUC &#x3d; 0.88&#x20;<italic>vs</italic>. 0.96&#x2013;0.97 in the other two signatures).</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>AUC scores and (95% confidence interval) for three RNAseq MSI gene signatures.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Signature</th>
<th align="center">
<xref ref-type="bibr" rid="B24">Li et&#x20;al. (2020)</xref>
</th>
<th align="center">
<xref ref-type="bibr" rid="B31">Pacinkova and Popovici (2019)</xref>
</th>
<th align="center">
<xref ref-type="bibr" rid="B12">Danaher et&#x20;al. (2019)</xref>
</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Experimental (CRC), <italic>n</italic>&#x20;&#x3d; 23</td>
<td align="char" char="(">1.0 (1&#x2013;1)</td>
<td align="char" char="(">0.9412 (0.8506&#x2013;1)</td>
<td align="char" char="(">0.9902 (0.963&#x2013;1)</td>
</tr>
<tr>
<td align="left">TCGA (CRC), <italic>n</italic>&#x20;&#x3d; 619</td>
<td align="char" char="(">0.9462 (0.9129&#x2013;0.9795)</td>
<td align="char" char="(">0.9583 (0.9313&#x2013;0.9854)</td>
<td align="char" char="(">0.9396 (0.9011&#x2013;0.9782)</td>
</tr>
<tr>
<td align="left">TCGA (UCEC), <italic>n</italic>&#x20;&#x3d; 533</td>
<td align="char" char="(">0.9397 (0.9161&#x2013;0.9633)</td>
<td align="char" char="(">0.6946 (0.6487&#x2013;0.7404)</td>
<td align="char" char="(">0.9442 (0.9202&#x2013;0.9682)</td>
</tr>
<tr>
<td align="left">TCGA (UCS &#x2b; ESCA), <italic>n</italic>&#x20;&#x3d; 138</td>
<td align="char" char="(">0.9981 (0.993&#x2013;1)</td>
<td align="char" char="(">0.9515 (0.8771&#x2013;1)</td>
<td align="char" char="(">1.0 (1&#x2013;1)</td>
</tr>
<tr>
<td align="left">TCGA (STAD), <italic>n</italic>&#x20;&#x3d; 380</td>
<td align="char" char="(">0.9664 (0.9405&#x2013;0.9922)</td>
<td align="char" char="(">0.8827 (0.839&#x2013;0.9263)</td>
<td align="char" char="(">0.9589 (0.9261&#x2013;0.9918)</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Thus, we conclude that in our tests, all three signatures were equally effective for the CRC, esophageal cancer, and uterine carcinosarcoma samples, whereas for the endometrial carcinomas and gastric cancer samples, the <italic>Danaher</italic> and <italic>Li</italic> signatures were found more effective.</p>
<p>We also separately analyzed only early-stage (stages I, IA, and IB) cancer patients from TCGA. In this case, statistical analysis could be performed only for CRC and gastric cancer groups because there were no early-stage MSI-high patients in the other groups. There were 16/13&#x20;MSI-high and 89/42&#x20;MSI-low samples in CRC and gastric cancer groups, respectively (<xref ref-type="sec" rid="s11">Supplementary Figure S1</xref>). All three signatures performed accurately on early-stage TCGA CRC with AUC 0.966&#x2013;0.997 and highly overlapping 95% confidence intervals (<xref ref-type="sec" rid="s11">Supplementary Figure S2</xref>). AUC for <italic>Li</italic> signature was the highest for predicting MSI status in gastric cancer (AUC &#x3d; 0.956), followed by <italic>Danaher</italic> (AUC &#x3d; 0.934) and <italic>Pacincova and Popovici</italic> (AUC &#x3d; 0.919) signatures (<xref ref-type="sec" rid="s11">Supplementary Figure&#x20;S2</xref>)<italic>.</italic>
</p>
</sec>
</sec>
<sec sec-type="discussion" id="s3">
<title>Discussion</title>
<p>In this study, we, for the first time, systematically compared and validated RNAseq gene signatures of MSI status in human solid tumors. All the signatures performed well on both literature and experimental samplings with the MSI statuses determined using the gold standard techniques routinely used in cancer molecular diagnostics. Interestingly, these three signatures were developed by different teams using different logical rationale and were mostly nonoverlapping with only one common gene, <italic>MLH1</italic>, which protein product heterodimerizes to form MutL alpha (<xref ref-type="bibr" rid="B25">Lindner et&#x20;al., 2021</xref>; <xref ref-type="bibr" rid="B33">Pannafino and Alani, 2021</xref>), important actor of the DNA mismatch repair system that is widely associated with the Lynch syndrome known as hereditary nonpolyposis CRC, and MSI (<xref ref-type="bibr" rid="B49">Yamamoto and Imai, 2019</xref>; <xref ref-type="bibr" rid="B25">Lindner et&#x20;al., 2021</xref>; <xref ref-type="bibr" rid="B41">Stinton et&#x20;al., 2021</xref>).</p>
<p>However, the functions of most other genes in the three MSI signatures strongly differ. We used Gene Ontology (GO) analysis to identify GO term &#x201c;biological processes&#x201d; enriched among the genes forming each signature. Of note, we found 23 enriched biological processes in <italic>Li</italic> gene signature (<xref ref-type="fig" rid="F4">Figure&#x20;4</xref>), 30 in <italic>Danaher</italic> signature (<xref ref-type="fig" rid="F5">Figure&#x20;5</xref>), and no significantly enriched processes in <italic>Pacincova and Popovici</italic> signature.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Biological process GO terms for genes included in Li signature. Visualized using R package enrichplot (<ext-link ext-link-type="uri" xlink:href="http://bioconductor.org/packages/release/bioc/html/enrichplot.html">http://bioconductor.org/packages/release/bioc/html/enrichplot.html</ext-link>). All terms passed Benjamini&#x2013;Hochberg adjusted <italic>p</italic>-value threshold of 0.05.</p>
</caption>
<graphic xlink:href="fmolb-08-737821-g004.tif"/>
</fig>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Biological process GO terms for genes included in Danaher signature. Visualized using R package enrichplot (<ext-link ext-link-type="uri" xlink:href="http://bioconductor.org/packages/release/bioc/html/%20enrichplot.html">http://bioconductor.org/packages/release/bioc/html/enrichplot.html</ext-link>). All terms passed Benjamini&#x2013;Hochberg adjusted <italic>p</italic>-value threshold of 0.05.</p>
</caption>
<graphic xlink:href="fmolb-08-737821-g005.tif"/>
</fig>
<p>The most significant terms in <italic>Li</italic> signature were associated with meiosis, mismatch repair, and (unexpectedly) with glycogen biosynthesis (<xref ref-type="fig" rid="F4">Figure&#x20;4</xref>). Interestingly, there were previously only indirect links reported for the glycogen metabolism and Lynch syndrome (<xref ref-type="bibr" rid="B20">Kato, 2020</xref>) or MSI (<xref ref-type="bibr" rid="B22">Krausova and Korinek, 2014</xref>; <xref ref-type="bibr" rid="B30">Oh et&#x20;al., 2016</xref>), e.g., through the Wnt signaling pathway (<xref ref-type="bibr" rid="B22">Krausova and Korinek, 2014</xref>). In <italic>Danaher</italic> signature, the most significant terms were associated with mismatch repair and with somatic hypermutation of immunoglobulin genes and physiologically related processes: somatic diversification of immune receptors and immunoglobulins (<xref ref-type="fig" rid="F5">Figure&#x20;5</xref>). The latter feature is widely associated with Lynch syndrome and MSI (<xref ref-type="bibr" rid="B1">Anghileri et&#x20;al., 2021</xref>; <xref ref-type="bibr" rid="B28">M&#xe4;ki-Nevala et&#x20;al., 2021</xref>). Among the signatures by <italic>Li</italic> and <italic>Danaher</italic>, &#x201c;Mismatch repair&#x201d; was the only common GO term (highlighted in italic on <xref ref-type="fig" rid="F4">Figures 4</xref> and <xref ref-type="fig" rid="F5">5</xref>), and mismatch repair deficiency is one of the most obvious reasons for MSI (<xref ref-type="bibr" rid="B18">Jin and Sinicrope, 2021</xref>). However, analysis of <italic>Pacincova and Popovici</italic> signature returned no enriched functional terms, thus evidencing that it contains quite a functionally heterogeneous gene&#x20;set.</p>
<p>We then performed Kyoto Encyclopedia of Genes and Genomes (KEGG) pathway enrichment and gene set enrichment (GSEA) analyses. The analyses returned three common statistically significantly enriched pathways for <italic>Danaher</italic> signature: &#x201c;Mismatch repair,&#x201d; &#x201c;Platinum drug resistance,&#x201d; and &#x201c;Colorectal cancer&#x201d; (<xref ref-type="sec" rid="s11">Supplementary Figures S3 and S4</xref>). Thus, GSEA and KEGG analyses confirmed our previous finding that <italic>Danaher</italic> signature is enriched by mismatch repair genes. However, neither KEGG pathway enrichment nor GSEA provided significantly enriched pathways for both <italic>Pacincova and Popovici</italic> and <italic>Li</italic> signatures.</p>
<p>This apparent gene content diversity among the signatures demonstrates that MSI can be associated with several or many processes that are not exclusively linked with DNA hypermutation and repair. This gives hope for building next-generation MSI signatures with even better performance/classifier scores.</p>
<p>Our results also imply that the <italic>Li</italic> and <italic>Danaher</italic> signatures may be effective for the CRCs, esophageal cancers, uterine carcinosarcomas, endometrial carcinomas, and gastric cancers. However, the overall effectiveness of <italic>Pacincova and Popovici</italic> signature in our tests was lower and limited to the first three among the cancer types discussed earlier. Moreover, all three signatures performed well for predicting MSI status in early-stage CRC and gastric cancer. Interestingly, the <italic>Li</italic> and <italic>Danaher</italic> signatures that were significantly enriched by genes for certain biological processes (<xref ref-type="fig" rid="F3">Figures 3</xref> and <xref ref-type="fig" rid="F4">4</xref>) were effective for more cancer types than <italic>Pacincova and Popovici</italic> signature that lacked enriched GO&#x20;terms.</p>
<p>In addition, the current experimental dataset may serve for validating new such signatures. Finally, we implemented here all the MSI signatures assessed as the free code ready to use with the user RNAseq data. In the future and after careful clinical validation, this may have a practical significance for establishing MSI statuses by screening, when available, RNAseq data for the cancers not necessarily strongly associated with the Lynch syndrome.</p>
</sec>
<sec sec-type="materials|methods" id="s4">
<title>Materials and Methods</title>
<sec id="s4-1">
<title>Patients and Samples</title>
<p>In this study, we investigated MSI status-annotated RNAseq profiles for a total of 1,693 cancer samples (one sample per individual patient). Among them, there were 619 literature CRC samples from TCGA cohort, 533 TCGA UCEC samples, 380 TCGA gastric cancer samples, 55 TCGA uterine carcinosarcoma samples, 83 TCGA esophageal cancer samples, and 36 experimental samples profiled by RNA sequencing in this study. TCGA RNAseq samples were extracted from five source datasets: COAD (colon cancer, <italic>n</italic>&#x20;&#x3d; 389) and READ (rectal cancer, <italic>n</italic>&#x20;&#x3d; 230) for &#x201c;CRC,&#x201d; UCEC (endometrial carcinoma, <italic>n</italic>&#x20;&#x3d; 533), STAD (gastric cancer, <italic>n</italic>&#x20;&#x3d; 380), UCS (uterine carcinosarcoma, <italic>n</italic>&#x20;&#x3d; 55), and ESCA (esophageal cancer, <italic>n</italic>&#x20;&#x3d; 83). MSI annotated TCGA data were downloaded from <ext-link ext-link-type="uri" xlink:href="https://gdac.broadinstitute.org/">https://gdac.broadinstitute.org/</ext-link>.</p>
<p>The experimental dataset included 23 colon cancer samples, five cervical cancer samples, two breast cancer, two gastric cancer samples, two glioblastoma samples, one ovarian cancer sample, and one endometrial carcinosarcoma sample. All experimental specimens were stored in the form of FFPE tissue blocks.</p>
</sec>
<sec id="s4-2">
<title>Gene Expression Profiling</title>
<p>To isolate RNA, 10-&#xb5;M thick paraffin slices were trimmed from each FFPE tissue block using a microtome. RNA preps were extracted using QIAGEN RNeasy FFPE Kit. RNA 6000 Nano or Qubit RNA Assay kits were used to measure RNA concentration. RNA integrity number was measured using Agilent 2100&#x20;bio-Analyzer. For depletion of ribosomal RNA and library construction, KAPA RNA Hyper with rRNA erase kit (HMR only) was used. Different adaptors were used for multiplexing samples in one sequencing run. Library concentrations and quality were measured using Qubit ds DNA HS Assay kit (Life Technologies) and Agilent Tapestation (Agilent). RNA sequencing was done using Illumina NextSeq 550 equipment for single-end sequencing, 50-bp read length, for approximately 30 million (mln) raw reads per sample. Data quality check was done on Illumina SAV. De-multiplexing was performed with the Illumina Bcl2fastq2 v 2.17 program. Sequencing data were deposited in National Center for Biotechnology Information Sequencing Read Archive under accession ID PRJNA744404.</p>
</sec>
<sec id="s4-3">
<title>Processing of Experimental RNAseq Data</title>
<p>RNAseq FASTQ files were processed with STAR aligner (<xref ref-type="bibr" rid="B50">Dobin et&#x20;al., 2013</xref>) in &#x201c;GeneCounts&#x201d; mode with the Ensembl human transcriptome annotation (Build version GRCh38 and transcript annotation GRCh38.89). Ensembl gene IDs were converted to HUGO Gene Nomenclature Committee (HGNC) gene symbols using the Complete HGNC dataset (<ext-link ext-link-type="uri" xlink:href="https://www.genenames.org/">https://www.genenames.org/</ext-link>, database version from July 13, 2017). Totally, expression levels were established for 36,596 annotated genes with the corresponding HGNC identifiers. Quantile normalization (qnorm python package) was used to normalize gene expression values.</p>
</sec>
<sec id="s4-4">
<title>Calculating Li et&#x20;al. Signature Values</title>
<p>MSI RNAseq signature described by <xref ref-type="bibr" rid="B24">Li et&#x20;al. (2020</xref>) was calculated according to the original paper. This signature defines <italic>LYG1</italic>, <italic>MSH4</italic>, and <italic>RPL22L1</italic> genes as &#x201c;plus&#x201d;-genes and <italic>DDX27, EPM2AIP1, HENMT1, MLH1, NHLRC1, NOL4L, RNLS, RTFDC1, SHROOM4, SMAP1, TTC30A,</italic> and <italic>ZSWIM3</italic> as &#x201c;minus&#x201d;-genes. The final score is a sum of log10-transformed normalized gene expression levels with consideration of each gene&#x20;sign.</p>
</sec>
<sec id="s4-5">
<title>Calculating Pacincova and Popovici Signature</title>
<p>MSI RNAseq signature described by Pacincova and Popovici was calculated according to the original paper (<xref ref-type="bibr" rid="B31">Pa&#x10d;&#xed;nkov&#xe1; and Popovici, 2019</xref>). This signature defines <italic>AGR2</italic>, <italic>TNNT1</italic>, <italic>VNN2</italic>, <italic>TNFSF9</italic>, <italic>TRIM7</italic>, and <italic>RPL22L1</italic> genes as &#x201c;plus&#x201d;-genes and <italic>ACSL6</italic>, <italic>ARID3A</italic>, <italic>ASCL2</italic>, <italic>AXIN2</italic>, <italic>EPDR1</italic>, <italic>GGT7</italic>, <italic>GNG4</italic>, <italic>KHDRBS3</italic>, <italic>KRT23</italic>, <italic>MLH1</italic>, <italic>NKD1</italic>, <italic>PLAGL2</italic>, <italic>PRR15</italic>, <italic>RUBCNL</italic>, <italic>SHROOM2</italic>, <italic>SHROOM4</italic>, <italic>TFCP2L1</italic>, <italic>TNNC2</italic>, and <italic>VAV3</italic> genes as &#x201c;minus&#x201d;-genes. The final score is a sum of log10-transformed gene expression levels with consideration of each gene&#x20;sign.</p>
</sec>
<sec id="s4-6">
<title>Calculating Danaher et&#x20;al. Signature</title>
<p>MSI RNAseq signature described by <xref ref-type="bibr" rid="B12">Danaher et&#x20;al. (2019</xref>)was calculated according to the original paper. This signature includes <italic>MLH1, MSH2, MSH6,</italic> and <italic>PMS2</italic> genes for calculating MMR loss score (MLS). First, a minimal Z-score (Zmin) of log2-transformed gene expressions was found. The final MLS &#x3d; (Zmin &#x2b; 1.03)/0.69, where 1.03 and 0.69 are the theoretical expectation and standard deviation of the minimum of four standard normal random variables, respectively.</p>
<p>Hypermutation predictor score was calculated by multiplying log2-transformed expressions of <italic>EPM2AIP1, TTC30A, SMAP1, RNLS, WNT11, SFXN1, SREBF1, TYMS, EIF5AL1,</italic> and <italic>WDR76</italic> genes by coefficients from the table given in the original article. The final hypermutation predictor score is a Z-score of the calculated value. The resulting MSI predictor score was calculated as follows:<disp-formula id="equ1">
<mml:math id="m1">
<mml:mrow>
<mml:msqrt>
<mml:mrow>
<mml:mi mathvariant="italic">min</mml:mi>
<mml:msup>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi mathvariant="bold-italic">MLS</mml:mi>
<mml:mo>,</mml:mo>
<mml:mn>0</mml:mn>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo>&#x2b;</mml:mo>
<mml:mi mathvariant="italic">max</mml:mi>
<mml:msup>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi mathvariant="bold-italic">HPS</mml:mi>
<mml:mo>,</mml:mo>
<mml:mn>0</mml:mn>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:msqrt>
</mml:mrow>
</mml:math>
</disp-formula>
</p>
<p>The MSI predictor score is further used as a predictor of MSI-high status.</p>
</sec>
<sec id="s4-7">
<title>Functional Gene Set Enrichment Analysis</title>
<p>KEGG and GO analyses were performed using the R clusterProfiler package. EnrichKEGG and enrichGO functions were used to implement enrichment analysis. GSEA analysis was performed using the web service <ext-link ext-link-type="uri" xlink:href="http://www.webgestalt.org">http://www.webgestalt.org</ext-link>. The following non-default parameters were selected: KEGG pathways were used as a functional database, and the minimum number of genes for a category was set to 3. We used Benjamini&#x2013;Hochberg false discovery rate correction method and applied a <italic>p</italic>-value threshold of 0.05 as a cutoff value for filtering pathways and GO&#x20;terms.</p>
</sec>
<sec id="s4-8">
<title>Experimental Microsatellite Instability Assessment by Polymerase Chain Reaction</title>
<p>Genomic DNA was isolated from FFPE tissue sections using the QIAamp DNA FFPE Tissue Kit (Qiagen, Valencia,&#x20;CA).</p>
<p>We performed MSI analysis using a set of five so-called &#x201c;main&#x201d; mononucleotide repeat markers: <italic>BAT25</italic>, <italic>BAT26</italic>, <italic>NR21</italic>, and <italic>NR24</italic> selected from the revised Bethesda panel (<xref ref-type="bibr" rid="B42">Suraweera et&#x20;al., 2002</xref>) and <italic>NR27</italic> selected from the modified pentaplex panel (<xref ref-type="bibr" rid="B8">Buhard et&#x20;al., 2006</xref>). Two additional mononucleotide repeat markers were also included: <italic>BAT40</italic>, as it was shown to improve the sensitivity of MSI testing in both CRC and extra-colonic tumors (<xref ref-type="bibr" rid="B17">Hartmann et&#x20;al., 2002</xref>; <xref ref-type="bibr" rid="B32">Pagin et&#x20;al., 2013</xref>) and <italic>CAT-25</italic>, which was reported to increase the sensitivity for identifying d<italic>MSH6</italic> tumors (<xref ref-type="bibr" rid="B43">Takehara et&#x20;al., 2018</xref>).</p>
<p>The primer sequences were taken from previous reports (<xref ref-type="bibr" rid="B17">Hartmann et&#x20;al., 2002</xref>; <xref ref-type="bibr" rid="B42">Suraweera et&#x20;al., 2002</xref>; <xref ref-type="bibr" rid="B8">Buhard et&#x20;al., 2006</xref>; <xref ref-type="bibr" rid="B43">Takehara et&#x20;al., 2018</xref>). The sequences of fluorescently labeled oligonucleotides are listed in <xref ref-type="table" rid="T3">Table&#x20;3</xref>.</p>
<table-wrap id="T3" position="float">
<label>TABLE 3</label>
<caption>
<p>Oligonucleotide sequences and fluorescent labels&#x20;used.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Marker</th>
<th align="center">Gene</th>
<th align="left"/>
<th align="center">Primer sequence and fluorescent labels (5&#x2032;-3&#x2032;)</th>
<th align="center">Length (bp)</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td rowspan="2" align="left">BAT26</td>
<td rowspan="2" align="left">
<italic>hMSH2</italic>
</td>
<td align="center">Forward</td>
<td align="left">FAM-CTGCGGTAATCAAGTTTTTAG</td>
<td rowspan="2" align="center">183</td>
</tr>
<tr>
<td align="center">Reverse</td>
<td align="left">AAC&#x200b;CAT&#x200b;TCA&#x200b;ACA&#x200b;TTT&#x200b;TTA&#x200b;ACC&#x200b;C</td>
</tr>
<tr>
<td rowspan="2" align="left">BAT25</td>
<td rowspan="2" align="left">
<italic>c-kit</italic>
</td>
<td align="center">Forward</td>
<td align="left">R6G-TACCAGGTGGCAAAGGGCA</td>
<td rowspan="2" align="center">153</td>
</tr>
<tr>
<td align="center">Reverse</td>
<td align="left">TCT&#x200b;GCA&#x200b;TTT&#x200b;TAA&#x200b;CTA&#x200b;TGG&#x200b;CTC</td>
</tr>
<tr>
<td rowspan="2" align="left">NR24</td>
<td rowspan="2" align="left">
<italic>Zinc finger 2 (ZNF-2)</italic>
</td>
<td align="center">Forward</td>
<td align="left">TAMRA-GCTGAATTTTACCTCCTGAC</td>
<td rowspan="2" align="center">131</td>
</tr>
<tr>
<td align="center">Reverse</td>
<td align="left">ATT&#x200b;GTG&#x200b;CCA&#x200b;TTG&#x200b;CAT&#x200b;TCC&#x200b;AA</td>
</tr>
<tr>
<td rowspan="2" align="left">NR21</td>
<td rowspan="2" align="left">
<italic>SLC7A8</italic>
</td>
<td align="center">Forward</td>
<td align="left">FAM-GAGTCGCTGGCACAGTTCTA</td>
<td rowspan="2" align="center">109</td>
</tr>
<tr>
<td align="center">Reverse</td>
<td align="left">CTG&#x200b;GTC&#x200b;ACT&#x200b;CGC&#x200b;GTT&#x200b;TAC&#x200b;AA</td>
</tr>
<tr>
<td rowspan="2" align="left">NR27</td>
<td rowspan="2" align="left">
<italic>Inhibitor of apoptosis Protein-1 (IAP1)</italic>
</td>
<td align="center">Forward</td>
<td align="left">R6G-AACCATGCTTGCAAACCACT</td>
<td rowspan="2" align="center">87</td>
</tr>
<tr>
<td align="center">Reverse</td>
<td align="left">CGA&#x200b;TAA&#x200b;TAC&#x200b;TAG&#x200b;CAA&#x200b;TGA&#x200b;CC</td>
</tr>
<tr>
<td rowspan="2" align="left">BAT40</td>
<td rowspan="2" align="left">
<italic>3-&#x3b2;-hydroxysteroid dehydrogenase (HSD3B1)</italic>
</td>
<td align="center">Forward</td>
<td align="left">ROX-AGTCCATTTTATATCCTCAAGC</td>
<td rowspan="2" align="center">145</td>
</tr>
<tr>
<td align="center">Reverse</td>
<td align="left">GTA&#x200b;GAG&#x200b;CAA&#x200b;GAC&#x200b;CAC&#x200b;CTT&#x200b;G</td>
</tr>
<tr>
<td rowspan="2" align="left">CAT25</td>
<td rowspan="2" align="left">
<italic>Caspase 2</italic>
</td>
<td align="left">Forward</td>
<td align="left">ROX-CTTCCCAACTTCCCTGTTCTTT</td>
<td rowspan="2" align="center">109</td>
</tr>
<tr>
<td align="center">Reverse</td>
<td align="left">TGA&#x200b;GCT&#x200b;GAG&#x200b;ATC&#x200b;GTG&#x200b;CCA&#x200b;CT</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The marker DNA products were PCR amplified using the qPCRmix-HS (Evrogen, Russia). PCR was carried out in a 20-&#x3bc;l final volume containing 1&#xd7; qPCRmix-HS, 2&#x2009;<italic>p</italic>moles of each primer, and approximately 20&#xa0;ng of DNA template.</p>
<p>The marker sets (1) <italic>BAT25</italic>, <italic>BAT26</italic>, <italic>NR21</italic>, and <italic>NR27</italic> and (2) <italic>BAT-40</italic> and <italic>CAT-25</italic> were co-amplified in one PCR tube per set. The marker <italic>NR-24</italic> was amplified in a separate PCR&#x20;tube.</p>
<p>PCR conditions for the tetraplex and duplex assays consisted of an initial 2-min denaturation step at 94C, followed by 37 cycles at 94&#xb0;C for 20&#xa0;s, 54&#xb0;C for 10&#xa0;s, and 72&#xb0;C for 12&#xa0;s, with a final extension at 72&#xb0;C for 2&#xa0;min. Conditions for monoplex reaction differed in annealing temperature: 53&#xb0;C.</p>
<p>Amplified PCR products were analyzed by capillary electrophoresis performed on ABI prism 3130&#x20;&#xd7; l System (Applied Biosystems, United&#x20;States). The microsatellite marker lengths were detected by Sequence Scanner software (Applied Biosystems, United&#x20;States).</p>
<p>The cutoff for MSI status classification was chosen on the basis of the threshold of approximately 40%, according to Umar A. et&#x20;al. (2004). Tumors with instability at &#x2a7e;2 of the five main mononucleotide markers were defined as MSI-H. Samples with instability at one main marker were further tested with the additional markers. Tumors with at least one unstable additional marker were defined as MSI-high. Otherwise, tumors were classified as MSI-low/MSS.</p>
</sec>
</sec>
</body>
<back>
<sec id="s5">
<title>Data Availability Statement</title>
<p>The datasets presented in this study can be found in online repositories. The names of the repository/repositories and accession number(s) can be found below: <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/bioproject/PRJNA744404">https://www.ncbi.nlm.nih.gov/bioproject/PRJNA744404</ext-link>.</p>
</sec>
<sec id="s6">
<title>Ethics Statement</title>
<p>The studies involving human participants were reviewed and approved by Vitamed Oncological Clinical Center. The patients/participants provided their written informed consent to participate in this study.</p>
</sec>
<sec id="s7">
<title>Author Contributions</title>
<p>AB supervised this study. EP and MSe collected and clinically annotated cancer patient biosamples. ER, AD, and MSu performed MSI experimental PCR analyses. VE and AS implemented computational platforms. MSo and VE analyzed expression data and did statistical calculations. AB, MSo, MSe, ER, and VE wrote the paper. AB is the guarantor of this work and, as such, has full access to all of the data in the study and takes responsibility for the integrity of the data and the accuracy of the data analysis.</p>
</sec>
<sec id="s8">
<title>Funding</title>
<p>This study was financed by the Ministry of Science and Higher Education of the Russian Federation within the framework of state support for the creation and development of World-Class Research Centers &#x201c;Digital biodesign and personalized healthcare&#x201d; No 075-15-2020-926.</p>
</sec>
<sec sec-type="COI-statement" id="s9">
<title>Conflict of Interest</title>
<p>Authors MSo and AB were employed by the company OmicsWay Corp. Authors VE, AS, and DN were employed by the company Oncobox&#x20;Ltd.</p>
<p>The remaining authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s10">
<title>Publisher&#x2019;s Note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations or those of the publisher, the editors, and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ack>
<p>We thank the OmicsWay research initiative for clinical and technical support. Amazon and Microsoft Azure grants supported Cloud-based computational facilities.</p>
</ack>
<sec id="s11">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fmolb.2021.737821/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fmolb.2021.737821/full&#x23;supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="Image4.PNG" id="SM1" mimetype="application/PNG" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table2.DOCX" id="SM2" mimetype="application/DOCX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image2.PNG" id="SM3" mimetype="application/PNG" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table1.XLSX" id="SM4" mimetype="application/XLSX" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image1.PNG" id="SM5" mimetype="application/PNG" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image3.PNG" id="SM6" mimetype="application/PNG" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Anghileri</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Di Ianni</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Paterra</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Langella</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Eoli</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>High Tumor Mutational burden and T-Cell Activation Are Associated with Long-Term Response to Anti-PD1 Therapy in Lynch Syndrome Recurrent Glioblastoma Patient</article-title>. <source>Cancer Immunol. Immunother.</source> <volume>70</volume>, <fpage>831</fpage>&#x2013;<lpage>842</lpage>. <pub-id pub-id-type="doi">10.1007/s00262-020-02769-4</pub-id> </citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Baretti</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Le</surname>
<given-names>D. T.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>DNA Mismatch Repair in Cancer</article-title>. <source>Pharmacol. Ther.</source> <volume>189</volume>, <fpage>45</fpage>&#x2013;<lpage>62</lpage>. <pub-id pub-id-type="doi">10.1016/j.pharmthera.2018.04.004</pub-id> </citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Boland</surname>
<given-names>C. R.</given-names>
</name>
<name>
<surname>Thibodeau</surname>
<given-names>S. N.</given-names>
</name>
<name>
<surname>Hamilton</surname>
<given-names>S. R.</given-names>
</name>
<name>
<surname>Sidransky</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Eshleman</surname>
<given-names>J.&#x20;R.</given-names>
</name>
<name>
<surname>Burt</surname>
<given-names>R. W.</given-names>
</name>
<etal/>
</person-group> (<year>1998</year>). <article-title>A National Cancer Institute Workshop on Microsatellite Instability for Cancer Detection and Familial Predisposition: Development of International Criteria for the Determination of Microsatellite Instability in Colorectal Cancer</article-title>. <source>Cancer Res.</source> <volume>58</volume>, <fpage>5248</fpage>&#x2013;<lpage>5257</lpage>. </citation>
</ref>
<ref id="B4">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Borisov</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Sorokin</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Garazha</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Buzdin</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2020a</year>). &#x201c;<article-title>Quantitation of Molecular Pathway Activation Using RNA Sequencing Data</article-title>,&#x201d; in <source>Methods in Molecular Biology</source>. (<publisher-loc>Totowa</publisher-loc>: <publisher-name>Humana Press</publisher-name>), <fpage>189</fpage>&#x2013;<lpage>206</lpage>.<pub-id pub-id-type="doi">10.1007/978-1-0716-0138-9_15</pub-id> </citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Borisov</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Sorokin</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Tkachev</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Garazha</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Buzdin</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2020b</year>). <article-title>Cancer Gene Expression Profiles Associated with Clinical Outcomes to Chemotherapy Treatments</article-title>. <source>BMC Med. Genomics</source> <volume>13</volume>, <fpage>1</fpage>&#x2013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1186/s12920-020-00759-0</pub-id> </citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bossel Ben-Moshe</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Gilad</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Perry</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Benjamin</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Balint-Lahat</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Pavlovsky</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>mRNA-seq Whole Transcriptome Profiling of Fresh Frozen versus Archived Fixed Tissues</article-title>. <source>BMC Genomics</source> <volume>19</volume>, <fpage>1</fpage>&#x2013;<lpage>11</lpage>. <pub-id pub-id-type="doi">10.1186/s12864-018-4761-3</pub-id> </citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Boyd</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>1997</year>). <article-title>Mathematical Tools for Demonstrating the Clinical Usefulness of Biochemical Markers</article-title>. <source>Scli</source> <volume>57</volume>, <fpage>46</fpage>&#x2013;<lpage>63</lpage>. <pub-id pub-id-type="doi">10.3109/00365519709168308</pub-id> </citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Buhard</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Cattaneo</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Wong</surname>
<given-names>Y. F.</given-names>
</name>
<name>
<surname>Yim</surname>
<given-names>S. F.</given-names>
</name>
<name>
<surname>Friedman</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Flejou</surname>
<given-names>J.-F.</given-names>
</name>
<etal/>
</person-group> (<year>2006</year>). <article-title>Multipopulation Analysis of Polymorphisms in Five Mononucleotide Repeats Used to Determine the Microsatellite Instability Status of Human Tumors</article-title>. <source>Jco</source> <volume>24</volume>, <fpage>241</fpage>&#x2013;<lpage>251</lpage>. <pub-id pub-id-type="doi">10.1200/JCO.2005.02.7227</pub-id> </citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Buzdin</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Sorokin</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Garazha</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Glusker</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Aleshin</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Poddubskaya</surname>
<given-names>E.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>RNA Sequencing for Research and Diagnostics in Clinical Oncology</article-title>. <source>Semin. Cancer Biol.</source> <volume>60</volume>, <fpage>311</fpage>&#x2013;<lpage>323</lpage>. <pub-id pub-id-type="doi">10.1016/j.semcancer.2019.07.010</pub-id> </citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Buzdin</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Sorokin</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Garazha</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Sekacheva</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Zhukov</surname>
<given-names>N.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Molecular Pathway Activation - New Type of Biomarkers for Tumor Morphology and Personalized Selection of Target Drugs</article-title>. <source>Semin. Cancer Biol.</source> <volume>53</volume>, <fpage>110</fpage>&#x2013;<lpage>124</lpage>. <pub-id pub-id-type="doi">10.1016/j.semcancer.2018.06.003</pub-id> </citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Tang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Tian</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Xie</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>EGFR Mutation Decreases FDG Uptake in Non-small C-ell L-ung C-ancer <italic>via</italic> the NOX4/ROS/GLUT1 axis</article-title>. <source>Int. J.&#x20;Oncol.</source> <volume>54</volume>, <fpage>370</fpage>&#x2013;<lpage>380</lpage>. <pub-id pub-id-type="doi">10.3892/ijo.2018.4626</pub-id> </citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Danaher</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Warren</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Ong</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Elliott</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Cesano</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Ferree</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>A Gene Expression Assay for Simultaneous Measurement of Microsatellite Instability and Anti-tumor Immune Activity</article-title>. <source>J.&#x20;Immunotherapy Cancer</source> <volume>7</volume>, <fpage>15</fpage>. <pub-id pub-id-type="doi">10.1186/s40425-018-0472-1</pub-id> </citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>DiGuardo</surname>
<given-names>M. A.</given-names>
</name>
<name>
<surname>Davila</surname>
<given-names>J.&#x20;I.</given-names>
</name>
<name>
<surname>Jackson</surname>
<given-names>R. A.</given-names>
</name>
<name>
<surname>Nair</surname>
<given-names>A. A.</given-names>
</name>
<name>
<surname>Fadra</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Minn</surname>
<given-names>K. T.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>RNA-seq Reveals Differences in Expressed Tumor Mutation Burden in Colorectal and Endometrial Cancers with and without Defective DNA-Mismatch Repair</article-title>. <source>J.&#x20;Mol. Diagn.</source> <volume>23</volume>, <fpage>555</fpage>&#x2013;<lpage>564</lpage>. <pub-id pub-id-type="doi">10.1016/j.jmoldx.2021.01.008</pub-id> </citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dobin</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Davis</surname>
<given-names>C. A.</given-names>
</name>
<name>
<surname>Schlesinger</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Drenkow</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zaleski</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Jha</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2013</year>). <article-title>STAR&#x003A; Ultrafast Universal RNA-Seq Aligner</article-title>. <source>Bioinformatics</source> <volume>29</volume>, <fpage>15</fpage>&#x2013;<lpage>21</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/bts635</pub-id> </citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dudley</surname>
<given-names>J.&#x20;C.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>M.-T.</given-names>
</name>
<name>
<surname>Le</surname>
<given-names>D. T.</given-names>
</name>
<name>
<surname>Eshleman</surname>
<given-names>J.&#x20;R.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Microsatellite Instability as a Biomarker for PD-1 Blockade</article-title>. <source>Clin. Cancer Res.</source> <volume>22</volume>, <fpage>813</fpage>&#x2013;<lpage>820</lpage>. <pub-id pub-id-type="doi">10.1158/1078-0432.CCR-15-1678</pub-id> </citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Engel</surname>
<given-names>K. B.</given-names>
</name>
<name>
<surname>Moore</surname>
<given-names>H. M.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Effects of Preanalytical Variables on the Detection of Proteins by Immunohistochemistry in Formalin-Fixed, Paraffin-Embedded Tissue</article-title>. <source>Arch. Pathol. Lab. Med.</source> <volume>135</volume>, <fpage>537</fpage>&#x2013;<lpage>543</lpage>. <pub-id pub-id-type="doi">10.5858/2010-0702-rair.1</pub-id> </citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Giannakis</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Mu</surname>
<given-names>X. J.</given-names>
</name>
<name>
<surname>Shukla</surname>
<given-names>S. A.</given-names>
</name>
<name>
<surname>Qian</surname>
<given-names>Z. R.</given-names>
</name>
<name>
<surname>Cohen</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Nishihara</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Genomic Correlates of Immune-Cell Infiltrates in Colorectal Carcinoma</article-title>. <source>Cell ReportsCell Rep</source> <volume>1517</volume> (<issue>4</issue>), <fpage>8571206</fpage>&#x2013;<lpage>8571865</lpage>. <comment>S2211124716303643</comment>. <pub-id pub-id-type="doi">10.1016/j.celrep.2016.10.009</pub-id> </citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hartmann</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Zanardo</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Bocker-Edmonston</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Blaszyk</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Dietmaier</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Stoehr</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2002</year>). <article-title>Frequent Microsatellite Instability in Sporadic Tumors of the Upper Urinary Tract</article-title>. <source>Cancer Res.</source> <volume>62</volume>, <fpage>6796</fpage>&#x2013;<lpage>6802</lpage>. </citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jin</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Sinicrope</surname>
<given-names>F. A.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Prognostic and Predictive Values of Mismatch Repair Deficiency in Non-metastatic Colorectal Cancer</article-title>. <source>Cancers</source> <volume>13</volume>, <fpage>300</fpage>&#x2013;<lpage>316</lpage>. <pub-id pub-id-type="doi">10.3390/cancers13020300</pub-id> </citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Johansen</surname>
<given-names>A. F. B.</given-names>
</name>
<name>
<surname>Kassentoft</surname>
<given-names>C. G.</given-names>
</name>
<name>
<surname>Knudsen</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Laursen</surname>
<given-names>M. B.</given-names>
</name>
<name>
<surname>Madsen</surname>
<given-names>A. H.</given-names>
</name>
<name>
<surname>Iversen</surname>
<given-names>L. H.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Validation of Computational Determination of Microsatellite Status Using Whole Exome Sequencing Data from Colorectal Cancer Patients</article-title>. <source>BMC Cancer</source> <volume>19</volume>, <fpage>971</fpage>. <pub-id pub-id-type="doi">10.1186/s12885-019-6227-7</pub-id> </citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kato</surname>
<given-names>N.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Pathology of clear Cell Carcinoma of the Ovary: A Basic View Based on Cultured Cells and Modern View from Comprehensive Approaches</article-title>. <source>Pathol. Int.</source> <volume>70</volume>, <fpage>591</fpage>&#x2013;<lpage>601</lpage>. <pub-id pub-id-type="doi">10.1111/pin.12954</pub-id> </citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname>
<given-names>E. L.</given-names>
</name>
<name>
<surname>Sorokin</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Kantelhardt</surname>
<given-names>S. R.</given-names>
</name>
<name>
<surname>Kalasauskas</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Sprang</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Fauss</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Intratumoral Heterogeneity and Longitudinal Changes in Gene Expression Predict Differential Drug Sensitivity in Newly Diagnosed and Recurrent Glioblastoma</article-title>. <source>Cancers</source> <volume>12</volume>, <fpage>520</fpage>. <pub-id pub-id-type="doi">10.3390/cancers12020520</pub-id> </citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Krausova</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Korinek</surname>
<given-names>V.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Wnt Signaling in Adult Intestinal Stem Cells and Cancer</article-title>. <source>Cell Signal.</source> <volume>26</volume>, <fpage>570</fpage>&#x2013;<lpage>579</lpage>. <pub-id pub-id-type="doi">10.1016/j.cellsig.2013.11.032</pub-id> </citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Le</surname>
<given-names>D. T.</given-names>
</name>
<name>
<surname>Uram</surname>
<given-names>J.&#x20;N.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Bartlett</surname>
<given-names>B. R.</given-names>
</name>
<name>
<surname>Kemberling</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Eyring</surname>
<given-names>A. D.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>PD-1 Blockade in Tumors with Mismatch-Repair Deficiency</article-title>. <source>N. Engl. J.&#x20;Med.</source> <volume>372</volume>, <fpage>2509</fpage>&#x2013;<lpage>2520</lpage>. <pub-id pub-id-type="doi">10.1056/nejmoa1500596</pub-id> </citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Feng</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>PreMSIm: An R Package for Predicting Microsatellite Instability from the Expression Profiling of a Gene Panel in Cancer</article-title>. <source>Comput. Struct. Biotechnol. J.</source> <volume>18</volume>, <fpage>668</fpage>&#x2013;<lpage>675</lpage>. <pub-id pub-id-type="doi">10.1016/j.csbj.2020.03.007</pub-id> </citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lindner</surname>
<given-names>A. K.</given-names>
</name>
<name>
<surname>Schachtner</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Tulchiner</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Thurnher</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Untergasser</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Obrist</surname>
<given-names>P.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Lynch Syndrome: Its Impact on Urothelial Carcinoma</article-title>. <source>Ijms</source> <volume>22</volume>, <fpage>531</fpage>. <pub-id pub-id-type="doi">10.3390/ijms22020531</pub-id> </citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Cheng</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Kang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Xi</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>K.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Noninvasively Evaluating the Grading and IDH1 Mutation Status of Diffuse Gliomas by Three-Dimensional Pseudo-continuous Arterial Spin Labeling and Diffusion-Weighted Imaging</article-title>. <source>Neuroradiology</source> <volume>60</volume>, <fpage>693</fpage>&#x2013;<lpage>702</lpage>. <pub-id pub-id-type="doi">10.1007/s00234-018-2021-5</pub-id> </citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Luchini</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Bibeau</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Ligtenberg</surname>
<given-names>M. J.&#x20;L.</given-names>
</name>
<name>
<surname>Singh</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Nottegar</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Bosse</surname>
<given-names>T.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>ESMO Recommendations on Microsatellite Instability Testing for Immunotherapy in Cancer, and its Relationship with PD-1/pd-L1 Expression and Tumour Mutational burden: A Systematic Review-Based Approach</article-title>. <source>Ann. Oncol.</source> <volume>30</volume>, <fpage>1232</fpage>&#x2013;<lpage>1243</lpage>. <pub-id pub-id-type="doi">10.1093/annonc/mdz116</pub-id> </citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>M&#xe4;ki&#x2010;Nevala</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Ukwattage</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Olkinuora</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Almusa</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Ahtiainen</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ristim&#xe4;ki</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Somatic Mutation Profiles as Molecular Classifiers of Ulcerative Colitis&#x2010;associated Colorectal Cancer</article-title>. <source>Int. J.&#x20;Cancer</source> <volume>148</volume>, <fpage>2997</fpage>&#x2013;<lpage>3007</lpage>. <pub-id pub-id-type="doi">10.1002/ijc.33492</pub-id> </citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Marcus</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Lemery</surname>
<given-names>S. J.</given-names>
</name>
<name>
<surname>Keegan</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Pazdur</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>FDA Approval Summary: Pembrolizumab for the Treatment of Microsatellite Instability-High Solid Tumors</article-title>. <source>Clin. Cancer Res.</source> <volume>25</volume>, <fpage>3753</fpage>&#x2013;<lpage>3758</lpage>. <pub-id pub-id-type="doi">10.1158/1078-0432.CCR-18-4070</pub-id> </citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Oh</surname>
<given-names>B. Y.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>S.-Y.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>Y. S.</given-names>
</name>
<name>
<surname>Hong</surname>
<given-names>H. K.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>T. W.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>S. H.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Twist1-induced Epithelial-Mesenchymal Transition According to Microsatellite Instability Status in colon Cancer Cells</article-title>. <source>Oncotarget</source> <volume>7</volume>, <fpage>57066</fpage>&#x2013;<lpage>57076</lpage>. <pub-id pub-id-type="doi">10.18632/oncotarget.10974</pub-id> </citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pa&#x10d;&#xed;nkov&#xe1;</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Popovici</surname>
<given-names>V.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Cross-platform Data Analysis Reveals a Generic Gene Expression Signature for Microsatellite Instability in Colorectal Cancer</article-title>. <source>Biomed. Res. Int.</source> <volume>2019</volume>, <fpage>1</fpage>&#x2013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1155/2019/6763596</pub-id> </citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pagin</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Zerimech</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Leclerc</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wacrenier</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Lejeune</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Descarpentries</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2013</year>). <article-title>Evaluation of a New Panel of Six Mononucleotide Repeat Markers for the Detection of DNA Mismatch Repair-Deficient Tumours</article-title>. <source>Br. J.&#x20;Cancer</source> <volume>108</volume>, <fpage>2079</fpage>&#x2013;<lpage>2087</lpage>. <pub-id pub-id-type="doi">10.1038/bjc.2013.213</pub-id> </citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pannafino</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Alani</surname>
<given-names>E.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Coordinated and Independent Roles for MLH Subunits in DNA Repair</article-title>. <source>Cells</source> <volume>10</volume>, <fpage>948</fpage>. <pub-id pub-id-type="doi">10.3390/cells10040948</pub-id> </citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ryan</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Sheahan</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Creavin</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Mohan</surname>
<given-names>H. M.</given-names>
</name>
<name>
<surname>Winter</surname>
<given-names>D. C.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>The Current Value of Determining the Mismatch Repair Status of Colorectal Cancer: A Rationale for Routine Testing</article-title>. <source>Crit. Rev. Oncology/Hematology</source> <volume>116</volume>, <fpage>38</fpage>&#x2013;<lpage>57</lpage>. <pub-id pub-id-type="doi">10.1016/j.critrevonc.2017.05.006</pub-id> </citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shemirani</surname>
<given-names>A. I.</given-names>
</name>
<name>
<surname>Haghighi</surname>
<given-names>M. M.</given-names>
</name>
<name>
<surname>Zadeh</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Fatemi</surname>
<given-names>S. R.</given-names>
</name>
<name>
<surname>Taleghani</surname>
<given-names>M. Y.</given-names>
</name>
<name>
<surname>Zali</surname>
<given-names>N.</given-names>
</name>
<etal/>
</person-group> (<year>2011</year>). <article-title>Simplified MSI Marker Panel for Diagnosis of Colorectal Cancer</article-title>. <source>Asian Pac. J.&#x20;Cancer Prev.</source> <volume>12</volume>, <fpage>2101</fpage>&#x2013;<lpage>2104</lpage>. </citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shia</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Immunohistochemistry versus Microsatellite Instability Testing for Screening Colorectal Cancer Patients at Risk for Hereditary Nonpolyposis Colorectal Cancer Syndrome</article-title>. <source>J.&#x20;Mol. Diagn.</source> <volume>10</volume>, <fpage>293</fpage>&#x2013;<lpage>300</lpage>. <pub-id pub-id-type="doi">10.2353/jmoldx.2008.080031</pub-id> </citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sorokin</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ignatev</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Barbara</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Vladimirova</surname>
<given-names>U.</given-names>
</name>
<name>
<surname>Muraveva</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Suntsova</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2020a</year>). <article-title>Molecular Pathway Activation Markers Are Associated with Efficacy of Trastuzumab Therapy in Metastatic HER2-Positive Breast Cancer Better Than Individual Gene Expression Levels</article-title>. <source>Biochem. Mosc.</source> <volume>85</volume>, <fpage>758</fpage>&#x2013;<lpage>772</lpage>. <pub-id pub-id-type="doi">10.1134/S0006297920070044</pub-id> </citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sorokin</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ignatev</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Poddubskaya</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Vladimirova</surname>
<given-names>U.</given-names>
</name>
<name>
<surname>Gaifullin</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Lantsov</surname>
<given-names>D.</given-names>
</name>
<etal/>
</person-group> (<year>2020b</year>). <article-title>RNA Sequencing in Comparison to Immunohistochemistry for Measuring Cancer Biomarkers in Breast Cancer and Lung Cancer Specimens</article-title>. <source>Biomedicines</source> <volume>8</volume>, <fpage>114</fpage>. <pub-id pub-id-type="doi">10.3390/BIOMEDICINES8050114</pub-id> </citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sorokin</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Kholodenko</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Kalinovsky</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Shamanskaya</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Doronin</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Konovalov</surname>
<given-names>D.</given-names>
</name>
<etal/>
</person-group> (<year>2020c</year>). <article-title>RNA Sequencing-Based Identification of Ganglioside GD2-Positive Cancer Phenotype</article-title>. <source>Biomedicines</source> <volume>8</volume>, <fpage>142</fpage>. <pub-id pub-id-type="doi">10.3390/BIOMEDICINES8060142</pub-id> </citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sorokin</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Poddubskaya</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Baranova</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Glusker</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Kogoniya</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Markarova</surname>
<given-names>E.</given-names>
</name>
<etal/>
</person-group> (<year>2020d</year>). <article-title>RNA Sequencing Profiles and Diagnostic Signatures Linked with Response to Ramucirumab in Gastric Cancer</article-title>. <source>Cold Spring Harb. Mol. Case Stud.</source> <volume>6</volume>, <fpage>a004945</fpage>. <pub-id pub-id-type="doi">10.1101/MCS.A004945</pub-id> </citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Stinton</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Jordan</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Fraser</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Auguste</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Court</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Al-Khudairy</surname>
<given-names>L.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Testing Strategies for Lynch Syndrome in People with Endometrial Cancer: Systematic Reviews and Economic Evaluation</article-title>. <source>Health Technol. Assess.</source> <volume>25</volume>, <fpage>1</fpage>&#x2013;<lpage>216</lpage>. <pub-id pub-id-type="doi">10.3310/hta25420</pub-id> </citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Suraweera</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Duval</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Reperant</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Vaury</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Furlan</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Leroy</surname>
<given-names>K.</given-names>
</name>
<etal/>
</person-group> (<year>2002</year>). <article-title>Evaluation of Tumor Microsatellite Instability Using Five Quasimonomorphic Mononucleotide Repeats and Pentaplex PCR</article-title>. <source>Gastroenterology</source> <volume>123</volume>, <fpage>1804</fpage>&#x2013;<lpage>1811</lpage>. <pub-id pub-id-type="doi">10.1053/gast.2002.37070</pub-id> </citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Takehara</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Nagasaka</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Nyuya</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Haruma</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Haraga</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Mori</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Accuracy of Four Mononucleotide-Repeat Markers for the Identification of DNA Mismatch-Repair Deficiency in Solid Tumors</article-title>. <source>J.&#x20;Transl. Med.</source> <volume>16</volume>, <fpage>5</fpage>. <pub-id pub-id-type="doi">10.1186/s12967-017-1376-4</pub-id> </citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tanioka</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Fan</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Parker</surname>
<given-names>J.&#x20;S.</given-names>
</name>
<name>
<surname>Hoadley</surname>
<given-names>K. A.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Integrated Analysis of RNA and DNA from the Phase III Trial CALGB 40601 Identifies Predictors of Response to Trastuzumab-Based Neoadjuvant Chemotherapy in HER2-Positive Breast Cancer</article-title>. <source>Clin. Cancer Res.</source> <volume>24</volume>, <fpage>5292</fpage>&#x2013;<lpage>5304</lpage>. <pub-id pub-id-type="doi">10.1158/1078-0432.CCR-17-3431</pub-id> </citation>
</ref>
<ref id="B45">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Tkachev</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Sorokin</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Garazha</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Borisov</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Buzdin</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2020</year>). &#x201c;<article-title>Oncobox Method for Scoring Efficiencies of Anticancer Drugs Based on Gene Expression Data</article-title>,&#x201d; in <source>Methods in Molecular Biology</source> (<publisher-loc>Totowa</publisher-loc>: <publisher-name>Humana Press</publisher-name>), <fpage>235</fpage>&#x2013;<lpage>255</lpage>. <pub-id pub-id-type="doi">10.1007/978-1-0716-0138-9_17</pub-id> </citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tomczak</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Czerwi&#x144;ska</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Wiznerowicz</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Review the Cancer Genome Atlas (TCGA): an Immeasurable Source of Knowledge</article-title>. <source>wo</source> <volume>1A</volume>, <fpage>68</fpage>&#x2013;<lpage>77</lpage>. <pub-id pub-id-type="doi">10.5114/wo.2014.47136</pub-id> </citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Waalkes</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Smith</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Penewit</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Hempelmann</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Konnick</surname>
<given-names>E. Q.</given-names>
</name>
<name>
<surname>Hause</surname>
<given-names>R. J.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Accurate Pan-Cancer Molecular Diagnosis of Microsatellite Instability by Single-Molecule Molecular Inversion Probe Capture and High-Throughput Sequencing</article-title>. <source>Clin. Chem.</source> <volume>64</volume>, <fpage>950</fpage>&#x2013;<lpage>958</lpage>. <pub-id pub-id-type="doi">10.1373/clinchem.2017.285981</pub-id> </citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Tong</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Buzdin</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Mu</surname>
<given-names>X.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>FDA-approved and Emerging Next Generation Predictive Biomarkers for Immune Checkpoint Inhibitors in Cancer Patients</article-title>. <source>Front. Oncol.</source> <volume>11</volume>, <fpage>683419</fpage>. <pub-id pub-id-type="doi">10.3389/fonc.2021.683419</pub-id> </citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yamamoto</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Imai</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>An Updated Review of Microsatellite Instability in the Era of Next-Generation Sequencing and Precision Medicine</article-title>. <source>Semin. Oncol.</source> <volume>46</volume>, <fpage>261</fpage>&#x2013;<lpage>270</lpage>. <pub-id pub-id-type="doi">10.1053/j.seminoncol.2019.08.003</pub-id> </citation>
</ref>
</ref-list>
</back>
</article>