<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Pediatr.</journal-id>
<journal-title>Frontiers in Pediatrics</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Pediatr.</abbrev-journal-title>
<issn pub-type="epub">2296-2360</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fped.2021.795529</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Pediatrics</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Aberrant <italic>GATA2</italic> Activation in Pediatric B-Cell Acute Lymphoblastic Leukemia</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Wang</surname> <given-names>Han</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1509372/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Cui</surname> <given-names>Bowen</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1553241/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Sun</surname> <given-names>Huiying</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Zhang</surname> <given-names>Fang</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1544636/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Rao</surname> <given-names>Jianan</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Wang</surname> <given-names>Ronghua</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Zhao</surname> <given-names>Shuang</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1333357/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Shen</surname> <given-names>Shuhong</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/174278/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Liu</surname> <given-names>Yu</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x0002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1049747/overview"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Pediatric Translational Medicine Institute, Shanghai Children&#x00027;s Medical Center, School of Medicine, Shanghai Jiao Tong University</institution>, <addr-line>Shanghai</addr-line>, <country>China</country></aff>
<aff id="aff2"><sup>2</sup><institution>Key Laboratory of Pediatric Hematology &#x00026; Oncology Ministry of Health, Department of Hematology &#x00026; Oncology, Shanghai Children&#x00027;s Medical Center, School of Medicine, Shanghai Jiao Tong University</institution>, <addr-line>Shanghai</addr-line>, <country>China</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Jan-Henning Klusmann, Martin Luther University of Halle-Wittenberg, Germany</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Ilaria Iacobucci, St. Jude Children&#x00027;s Research Hospital, United States; Zhijie Wu, National Institutes of Health (NIH), United States</p></fn>
<corresp id="c001">&#x0002A;Correspondence: Yu Liu <email>liuyu&#x00040;scmc.com.cn</email></corresp>
<fn fn-type="other" id="fn001"><p>This article was submitted to Pediatric Hematology and Hematological Malignancies, a section of the journal Frontiers in Pediatrics</p></fn></author-notes>
<pub-date pub-type="epub">
<day>11</day>
<month>01</month>
<year>2022</year>
</pub-date>
<pub-date pub-type="collection">
<year>2021</year>
</pub-date>
<volume>9</volume>
<elocation-id>795529</elocation-id>
<history>
<date date-type="received">
<day>01</day>
<month>11</month>
<year>2021</year>
</date>
<date date-type="accepted">
<day>02</day>
<month>12</month>
<year>2021</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x000A9; 2022 Wang, Cui, Sun, Zhang, Rao, Wang, Zhao, Shen and Liu.</copyright-statement>
<copyright-year>2022</copyright-year>
<copyright-holder>Wang, Cui, Sun, Zhang, Rao, Wang, Zhao, Shen and Liu</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract><p><italic>GATA2</italic> is a transcription factor that is critical for the generation and survival of hematopoietic stem cells (HSCs). It also plays an important role in the regulation of myeloid differentiation. Accordingly, <italic>GATA2</italic> expression is restricted to HSCs and hematopoietic progenitors as well as early erythroid cells and megakaryocytic cells. Here we identified aberrant <italic>GATA2</italic> expression in B-cell acute lymphoblastic leukemia (B-ALL) by analyzing transcriptome sequencing data obtained from St. Jude Cloud. Differentially expressed genes upon <italic>GATA2</italic> activation showed significantly myeloid-like transcription signature. Further analysis identified several tumor-associated genes as targets of <italic>GATA2</italic> activation including <italic>BAG3</italic> and <italic>EPOR</italic>. In addition, the correlation between <italic>KMT2A-USP2</italic> fusion and <italic>GATA2</italic> activation not only indicates a potential trans-activating mechanism of <italic>GATA2</italic> but also suggests that <italic>GATA2</italic> is a target of KMT2A-USP2. Furthermore, by integrating whole-genome and transcriptome sequencing data, we showed that <italic>GATA2</italic> is also cis activated. A somatic focal deletion located in the <italic>GATA2</italic> neighborhood that disrupts the boundaries of topologically associating domains was identified in one B-ALL patient with <italic>GATA2</italic> activation. These evidences support the hypothesis that <italic>GATA2</italic> could be involved in leukemogenesis of B-ALL and can be transcriptionally activated through multiple mechanisms. The findings of aberrant activation of <italic>GATA2</italic> and its molecular function extend our understanding of transcriptional factor dysregulation in B-ALL.</p></abstract>
<kwd-group>
<kwd><italic>GATA2</italic></kwd>
<kwd>pediatric B-cell acute lymphoblastic leukemia</kwd>
<kwd>leukemogenesis</kwd>
<kwd>transcriptional dysregulation</kwd>
<kwd>cis-activation</kwd>
</kwd-group>
<contract-sponsor id="cn001">National Natural Science Foundation of China<named-content content-type="fundref-id">10.13039/501100001809</named-content></contract-sponsor>
<contract-sponsor id="cn002">Science and Technology Commission of Shanghai Municipality<named-content content-type="fundref-id">10.13039/501100003399</named-content></contract-sponsor>
<counts>
<fig-count count="5"/>
<table-count count="0"/>
<equation-count count="0"/>
<ref-count count="48"/>
<page-count count="12"/>
<word-count count="6750"/>
</counts>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1">
<title>Introduction</title>
<p>Pediatric acute lymphoblastic leukemia (ALL) is the most common malignant disease in children (<xref ref-type="bibr" rid="B1">1</xref>). Although studies have shown improved cure rates, with the overall survival rate of pediatric ALL patients exceeding 90% (<xref ref-type="bibr" rid="B2">2</xref>), the prognosis of some leukemia subtypes remains poor. For example, only 75% of T-cell acute lymphoblastic leukemia (T-ALL) patients achieve remission (<xref ref-type="bibr" rid="B3">3</xref>), and patients with the B-cell acute lymphoblastic leukemia (B-ALL) subtypes of <italic>BCR-ABL1, BCR-ABL1</italic> like, and <italic>KMT2A</italic> (<italic>MLL</italic>) rearranged have a high risk of treatment failure and poor prognosis (<xref ref-type="bibr" rid="B4">4</xref>&#x02013;<xref ref-type="bibr" rid="B7">7</xref>).</p>
<p>Advances in genome-wide analyses have enabled researchers to obtain a detailed view of the genetic alterations involved in the pathogenesis of ALL (<xref ref-type="bibr" rid="B8">8</xref>). The coordinated action of transcription factors controls early lymphoid development and leukemia formation, and many of these transcription factors have been found to be dysregulated in ALL (<xref ref-type="bibr" rid="B9">9</xref>). Patients with B-ALL harbor many genetic alterations in transcription factors including chromosomal rearrangements, deletions, or inactivating mutations in <italic>DUX4, PAX5, IKZF1</italic>, and <italic>TCF3</italic>, among others (<xref ref-type="bibr" rid="B10">10</xref>). For example, the <italic>PAX5</italic> P80R mutation impairs B cell differentiation and drives B lymphoid leukemogenesis (<xref ref-type="bibr" rid="B11">11</xref>). Patients with mutation or deletion of <italic>IKZF1</italic> were verified to have high levels of residual disease at day 19 and poor outcomes (<xref ref-type="bibr" rid="B12">12</xref>). T-ALL is also characterized by the dysregulation of core transcription factors, including <italic>TAL1/2, LMO1/2</italic>, and <italic>TLX1/3</italic>, caused by chromosomal rearrangements and copy number alterations (<xref ref-type="bibr" rid="B13">13</xref>, <xref ref-type="bibr" rid="B14">14</xref>). Notably, 8&#x02013;10% of T-ALL (<xref ref-type="bibr" rid="B14">14</xref>) and 7% of B-ALL (<xref ref-type="bibr" rid="B11">11</xref>) cases cannot be categorized into any of the currently established subtypes based on genome variation, and such cases commonly have inferior outcomes (<xref ref-type="bibr" rid="B8">8</xref>). Studies on novel driver transcription factor dysregulation could assist subtype classification and the development of targeted therapies for these patients with unknown drivers.</p>
<p>GATA family proteins are tissue-specific master transcriptional regulators, among GATAs, <italic>GATA1, GATA2</italic>, and <italic>GATA3</italic> have lineage-specific functions which are essential for normal hematopoiesis (<xref ref-type="bibr" rid="B15">15</xref>). <italic>GATA1</italic> is the main driver for the differentiation of hematopoietic progenitors into specific blood cell lineages, leading to a loss of self-renewal capacity (<xref ref-type="bibr" rid="B16">16</xref>). <italic>GATA2</italic> regulates the proliferation of hematopoietic stem cells (HSCs) and maintains the HSC pool (<xref ref-type="bibr" rid="B17">17</xref>). <italic>GATA3</italic> is pivotal for the development of T lymphocytes (<xref ref-type="bibr" rid="B15">15</xref>). Dysregulation and mutation of these three GATA transcription members are involved in leukemogenesis. For example, the <italic>GATA3</italic> expression level was linked to leukemogenesis (<xref ref-type="bibr" rid="B18">18</xref>), and recurrent mutations in the DNA binding domain of <italic>GATA3</italic> were detected in ETP-ALL patients and found to block T cell development (<xref ref-type="bibr" rid="B19">19</xref>). Heterozygous deletions of <italic>GATA2</italic>, which has been recognized as an acute myeloid leukemia (AML) predisposition gene (<xref ref-type="bibr" rid="B20">20</xref>), promote <italic>EVI1</italic>-provoked leukemic transformation (<xref ref-type="bibr" rid="B21">21</xref>). And high expression of <italic>GATA2</italic> in AML was associated with adverse prognosis (<xref ref-type="bibr" rid="B22">22</xref>). However, these findings were made only within the context of the specific lineage each GATA member was known to be physiologically associated with. Little is known regarding the aberrant activation of these transcription factors in other lineages.</p>
<p>In the present study, we identified the first time aberrant <italic>GATA2</italic> activation in a subset of B-ALL patients. The transcriptome sequencing (RNA-seq) datasets of 629 B-ALL patients obtained from St. Jude Cloud (<xref ref-type="bibr" rid="B23">23</xref>) were used to identify B-ALL patients with outlier <italic>GATA2</italic> expression. The effect of <italic>GATA2</italic> activation was further explored by differential expression analysis and transcription factor binding motif analysis, and several downstream targets of <italic>GATA2</italic> activation were identified. Finally, by integrating data from whole-genome sequencing, transcriptome sequencing, and 3-D genome analysis, we found that <italic>GATA2</italic> was potentially transcriptionally activated by multiple mechanisms, both cis and trans.</p>
</sec>
<sec sec-type="materials and methods" id="s2">
<title>Materials and Methods</title>
<sec>
<title>Gene Expression in Pediatric B-ALL and Differentially Expressed Gene Analysis</title>
<p>Count values generated from RNA-seq data of leukemia patients were downloaded from St. Jude Cloud (<xref ref-type="bibr" rid="B23">23</xref>). FPKM values were calculated from count values with an in-house perl script. Cases with <italic>GATA2</italic> FPKM values &#x0003E;3-fold standard deviation of the mean in each subtype were categorized as <italic>GATA2</italic> activation. Protein-coding genes with FPKM &#x0003E;1 in at least 30% of patients were defined as expressed genes and collected for further analysis. Batch effects introduced by different sequencing protocols (<xref ref-type="supplementary-material" rid="SM5">Supplementary Table 1</xref>) were corrected with DESeq2. Differentially expressed gene (DEG) analysis was performed on the expressed genes using DESeq2 (<xref ref-type="bibr" rid="B24">24</xref>) with subtype as a covariate. Genes with fold change &#x0003E;1.5 and <italic>p</italic>-value &#x0003C; 0.05 were identified as DEGs.</p>
</sec>
<sec>
<title>Gene Set Enrichment Analysis</title>
<p>Gene set enrichment analysis of genes up-regulated and down-regulated upon <italic>GATA2</italic> activation was performed using ToppGene (<xref ref-type="bibr" rid="B25">25</xref>). The categories with top significance enriched in Gene Ontology (GO) terms and ToppCell Altas which points to cell type in ToppGene gene set were shown in figures.</p>
</sec>
<sec>
<title>Transcription Binding Motif Analysis</title>
<p>GATA2 ChIP-seq data (GSM1600544) from the LNCaP cell line was used to calculate the distance between GATA2 peaks and the transcription start site (TSS) of the nearest gene to determine the genomic range for motif analysis. According to the results, the 200 bp sequences centered on the TSS of protein coding genes across the whole genome were analyzed with FIMO (<xref ref-type="bibr" rid="B26">26</xref>) for the presence of the transcription factor binding motif of the GATA family. Predictions with a <italic>p</italic>-value &#x0003C; 0.0001 were considered positive.</p>
</sec>
<sec>
<title>Allelic Specific Expression Analysis</title>
<p>The heterozygous markers and RNA-seq BAM file for SJALL043839_D1 were obtained from previously published data (<xref ref-type="bibr" rid="B27">27</xref>). Allelic specific expression (ASE) analysis was performed with cis-X (<xref ref-type="bibr" rid="B28">28</xref>) following the user&#x00027;s instructions. The ASE of <italic>GATA2</italic> was calculated with in-house R script.</p>
</sec>
<sec>
<title>Data Visualization</title>
<p>The protein structure of the in-frame KMT2A-USP2 fusion was visualized with ProteinPaint (<xref ref-type="bibr" rid="B29">29</xref>). The topologically associating domain (TAD) structure from high-through chromosome conformation capture (Hi-C) data from the Nalm6 and Kelly cell line, and the coverage plot of whole-genome sequencing (WGS) data of tumor and matched remission sample of SJALL043839 were visualized with GenomePaint (<xref ref-type="bibr" rid="B30">30</xref>).</p>
</sec>
<sec>
<title>Statistical Analysis</title>
<p>The DEG analysis was performed with DESeq2. GATA family member expression between different lineages of leukemia was compared using Wilcoxon test. The correlation in expression between <italic>GATA2</italic> and potential target genes was calculated with Pearson correlation. All analysis were performed in R (version 3.5.3).</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>Results</title>
<sec>
<title>Aberrant <italic>GATA2</italic> Transcription in B-Cell Acute Lymphoblastic Leukemia</title>
<p>We examined the RNA expression of three hematopoietic GATA transcription factors (<italic>GATA1, GATA2</italic>, and <italic>GATA3</italic>) in a total of 1,644 pediatric leukemia patients with AML (<italic>n</italic> = 297), T-ALL (<italic>n</italic> = 99), and B-ALL (<italic>n</italic> = 1,248) using RNA-seq data available at St. Jude Cloud (<xref ref-type="bibr" rid="B23">23</xref>) (<xref ref-type="fig" rid="F1">Figure 1A</xref>). Consistent with their established roles in hemopoiesis (<xref ref-type="bibr" rid="B16">16</xref>, <xref ref-type="bibr" rid="B31">31</xref>), the three GATA transcription factors showed lineage specific patterns of transcription. <italic>GATA1</italic> and <italic>GATA2</italic> were more highly transcribed in AML as compared with B-ALL (<italic>p</italic>-value &#x0003C; 0.0001, Wilcoxon test) and T-ALL (<italic>p</italic>-value &#x0003C; 0.0001, Wilcoxon test), and <italic>GATA3</italic> showed the highest level of transcription in T-ALL (<italic>p</italic>-values &#x0003C; 0.0001 in comparison with AML and B-ALL, Wilcoxon test). On the other hand, transcription levels of all three GATA genes were low in B-ALL. In particular, we found that <italic>GATA2</italic> was not transcribed in the majority of B-ALL patients, with FPKM values &#x0003C;1 in 79.4% (991 out of 1,248) cases (median FPKM = 0.297). The lack of <italic>GATA2</italic> transcription in B-ALL was in accordance with its role in common lymphoid progenitor cells during normal hemopoiesis (<xref ref-type="bibr" rid="B32">32</xref>). However, it was noticeable that <italic>GATA2</italic> was actively transcribed in a subset of B-ALL patients (<italic>n</italic> = 257 with FPKM &#x0003E; 1).</p>
<fig id="F1" position="float">
<label>Figure 1</label>
<caption><p>Aberrant transcription of <italic>GATA2</italic> in leukemia. <bold>(A)</bold> Violin plots showing the expression of three hematopoietic GATA transcription factors in pediatric leukemia patients; expression data are from St. Jude Cloud (AML <italic>n</italic> = 297, T-ALL <italic>n</italic> = 99, B-ALL <italic>n</italic> =1,248). &#x0002A;&#x0002A;&#x0002A;<italic>p</italic> &#x0003C; 0.001. <bold>(B)</bold> The <italic>GATA2</italic> expression levels in 629 B-ALL patients with definitive subtype information were plotted. Thirteen <italic>GATA2</italic>-outlier patients were shown in red dots. <bold>(C)</bold> Information from 13 <italic>GATA2</italic>-outlier cases (i.e., sample ID, subtype, major type of fusion, and <italic>GATA2</italic> FPKM) is listed.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fped-09-795529-g0001.tif"/>
</fig>
<p>We next asked if <italic>GATA2</italic> transcription was enriched in a specific B-ALL subtype. Toward this end, we checked transcription levels of <italic>GATA2</italic> in 629 of the 1,248 B-ALL cases mentioned above, for which definitive subtype information was available. First of all, we found that active transcription of <italic>GATA2</italic> was associated with <italic>ETV6-RUNX1</italic> rearranged B-ALL (ETV, <xref ref-type="fig" rid="F1">Figure 1B</xref>, median FPKM = 2.26, <italic>p</italic> &#x0003C; 0.0001, Wilcoxon test, ETV compared with non-ETV). Secondly, aberrantly high <italic>GATA2</italic> transcription was observed in a subset of B-ALL patients across different subtypes. We next identified the cases with outlier <italic>GATA2</italic> transcription defined as <italic>GATA2</italic> transcription levels greater than three standard deviations of the mean in each subtype. Aberrant transcription was analyzed within each subtype to minimize the variation across different subtypes. According to this criterion, a total of 13 B-ALL cases with aberrant activation of <italic>GATA2</italic> were identified from 7 subtypes (<xref ref-type="fig" rid="F1">Figure 1B</xref>), accounting for 2.07% of B-ALL cases. These 13 B-ALL cases included five with high hyperdiploid (HYPER), two with <italic>KMT2A</italic> rearrangements (MLL), two with ETV, and one each with <italic>DUX4</italic> rearrangement (DUX4), low hypodiploid (HYPO), <italic>BCR-ABL1</italic> (PH), and <italic>BCR-ABL1</italic>-like (PHL) (<xref ref-type="fig" rid="F1">Figure 1C</xref>). In addition, no outlier <italic>GATA2</italic> transcription was identified for the following four subtypes: <italic>TCF3-PBX1</italic> (E2A), <italic>MEF2D</italic> rearrangements (MEF2D), <italic>PAX5</italic> alterations or mutations (PAX5), and <italic>ZNF384</italic> rearrangements (ZNF384) (<xref ref-type="fig" rid="F1">Figure 1B</xref>; <xref ref-type="supplementary-material" rid="SM5">Supplementary Table 1</xref>). To further investigate the effect of <italic>GATA2</italic> activation, we selected 584 patients from seven subtypes with at least one <italic>GATA2</italic> outlier case identified. Among these 584 cases, 13 cases with aberrant activation of <italic>GATA2</italic> were classified as the <italic>GATA2</italic>-outlier group and the remaining cases (<italic>n</italic> = 571) as the <italic>GATA2</italic>-normal group.</p>
</sec>
<sec>
<title>Dysregulated <italic>GATA2</italic> Transcription Activates Myeloid Lineage-Specific Genes Transcription in B-ALL</title>
<p>To understand the impact of dysregulated <italic>GATA2</italic> transcription on B-ALL, we performed differential expression analysis between the <italic>GATA2</italic>-outlier group and the <italic>GATA2</italic>-normal group using DESeq2 with B-ALL subtypes as a covariate. Out of 10,505 expressed protein coding genes (FPKM &#x0003E;1 in &#x0003E;30% patients), we identified 1,150 differentially expressed genes (DEGs), including 699 up-regulated and 451 down-regulated, in <italic>GATA2</italic>-outlier cases (<italic>p</italic>-value &#x0003C; 0.05 and |fold change| &#x0003E;1.5; <xref ref-type="fig" rid="F2">Figure 2A</xref>; <xref ref-type="supplementary-material" rid="SM5">Supplementary Table 2</xref>). We firstly checked the transcription of B cell and myeloid lineage specific markers commonly tested in clinical diagnosis in the DEG result (<xref ref-type="supplementary-material" rid="SM5">Supplementary Table 3</xref>). Seven out of twelve myeloid markers used in clinical test were significantly up regulated in <italic>GATA2</italic>-outlier cases (Fisher&#x00027;s exact test, <italic>p</italic> &#x0003C; 0.001) (<xref ref-type="fig" rid="F2">Figures 2A,B</xref>), while none of the 12 myeloid markers were down-regulated. On the other hand, B-lineage markers were significantly down regulated (Fisher&#x00027;s exact test, <italic>p</italic> &#x0003C; 0.001) (<xref ref-type="fig" rid="F2">Figure 2A</xref>; <xref ref-type="supplementary-material" rid="SM1">Supplementary Figure 1A</xref>) and none of these B-lineage markers showed up-regulated expression. We next performed gene set enrichment analyses on up-regulated and down-regulated DEGs separately using ToppGene tool (<xref ref-type="bibr" rid="B25">25</xref>). Consistently, the 699 up-regulated DEGs were significantly enriched in myeloid leukocyte-associated enrichment categories including both GO (terms with a <italic>p</italic>-value &#x0003C; 10<sup>&#x02212;33</sup> are listed in <xref ref-type="fig" rid="F2">Figure 2C</xref>) and ToppCell Atlas (categories with a <italic>p</italic>-value &#x0003C; 10<sup>&#x02212;33</sup> are listed in <xref ref-type="fig" rid="F2">Figure 2D</xref>), suggesting the activation of a myeloid lineage-related transcription circuit following <italic>GATA2</italic> dysregulation (<xref ref-type="bibr" rid="B15">15</xref>). In contrast, the 451 down-regulated DEGs were significantly enriched for the early B-lineage precursor cells stage (<xref ref-type="supplementary-material" rid="SM1">Supplementary Figure 1B</xref>) from which B-ALL leukemic cells originate. These observations indicated a potential switch from B-cell lymphocytes related transcription circuit to myeloid lineage related transcription circuit upon <italic>GATA2</italic> activation. Down-regulated DEGs were also significantly enriched for cell cycle process (<xref ref-type="supplementary-material" rid="SM1">Supplementary Figure 1C</xref>), implying that <italic>GATA2</italic> could be involved in the proliferation of blasts in <italic>GATA2</italic>-outlier patients.</p>
<fig id="F2" position="float">
<label>Figure 2</label>
<caption><p>Effects of aberrant <italic>GATA2</italic> transcription on B-ALL. <bold>(A)</bold> Volcano plot illustrating the differentially expressed genes (DEGs) between <italic>GATA2</italic>-outlier patients and <italic>GATA2</italic>-normal patients. Gray dots indicate genes with no significant differences. Light red and light blue dots indicate 699 up-regulated and 451 down-regulated DEGs, respectively, in <italic>GATA2</italic>-outlier patients (<italic>p</italic>-value &#x0003C; 0.05 and |FC| &#x0003E; 1.5). DEGs predicted to be bound by <italic>GATA2</italic> in motif analysis are highlighted in dark red (up-regulated) and dark blue (down-regulated). DEGs overlapped with Myeloid markers and B cell markers commonly used in clinical diagnosis are highlighted in orange (up-regulated) and green (down-regulated). <bold>(B)</bold> Intersection between 699 up-regulated DEGs (left) and myeloid markers tested in clinical diagnosis (right). Seven out of 12 myeloid markers were upregulated in <italic>GATA2</italic>-outlier cases and labeled below. <bold>(C,D)</bold> Results of gene set enrichment analysis showing that 699 up-regulated DEGs are enriched in myelocyte-associated Biological Process (BP) and ToppCell Altas categories. The categories with a <italic>p</italic>-value &#x0003C; 10<sup>&#x02212;30</sup> are listed and sorted by <italic>p</italic>-value in reverse order. The color of each dot represents <italic>q</italic>-value, and the size of the dot represents the number of DEGs in each category.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fped-09-795529-g0002.tif"/>
</fig>
</sec>
<sec>
<title><italic>GATA2</italic> Activates Transcription of Tumor-Associated Genes in B-ALL</title>
<p>To investigate the targets of <italic>GATA2</italic> activation that are potentially involved in B-ALL, we combined genome-wide computational prediction of GATA family transcription factor binding motifs and the differential expression analysis described above. We first analyzed GATA2 chromatin immunoprecipitation sequencing (ChIP-seq) profiles of LNCaP cancer cell line published previously (<xref ref-type="bibr" rid="B33">33</xref>) to estimate the distance between each GATA2 binding site and its potential target gene. Only protein coding genes were included in this analysis. We found that among the GATA2 peaks with a nearby potential target gene (within 2 kb of the peak), 37.3% were located within &#x000B1;100 bp of the transcription start site (TSS) of the nearby gene (<xref ref-type="supplementary-material" rid="SM2">Supplementary Figure 2A</xref>). This suggested that GATA2 targets downstream genes by predominantly binding to the &#x000B1;100 bp of TSS region. Therefore, we scanned the TSS &#x000B1;100 bp sequences of all protein coding genes across the human genome to predict GATA2 binding sites. This resulted in the identification of 313 genes with one or more GATA family binding motifs that may be direct targets of GATA factors (<italic>p</italic>-value &#x0003C; 0.0001 with FIMO, <xref ref-type="supplementary-material" rid="SM5">Supplementary Table 4</xref>). The predictions were confirmed by gene set enrichment analysis; the 313 genes showed significant enrichment in experimentally derived GATA binding sites from the ChIP-seq analysis in ENCODE project (<xref ref-type="bibr" rid="B34">34</xref>, <xref ref-type="bibr" rid="B35">35</xref>) (<xref ref-type="supplementary-material" rid="SM2">Supplementary Figure 2B</xref>), supporting the prediction of GATA2 targets.</p>
<p>We next integrated the DEGs from differential expression analysis with the 313 targets of GATA factors from computational prediction. We identified 46 potential targets dysregulated by aberrant activation of <italic>GATA2</italic>, including 13 down-regulated DEGs (<xref ref-type="supplementary-material" rid="SM2">Supplementary Figure 2C</xref>) and 33 up-regulated DEGs (<xref ref-type="fig" rid="F3">Figure 3A</xref>; <xref ref-type="supplementary-material" rid="SM5">Supplementary Table 2</xref>). We focused on the up-regulated DEGs in this analysis. Notably, there were several known tumor-associated genes (highlighted in <xref ref-type="fig" rid="F2">Figure 2A</xref>) among these 33 target genes, including <italic>BAG3, EPOR</italic>, and <italic>KLF1</italic>. <italic>BAG3</italic>, which was reported to be an anti-apoptotic gene involved in leukemic cell survival and response to therapy (<xref ref-type="bibr" rid="B36">36</xref>), was among the most significant DEGs between <italic>GATA2</italic>-outlier and <italic>GATA2</italic>-normal B-ALL patients (<italic>p</italic>-value = 7.9 &#x000D7; 10<sup>&#x02212;14</sup>; log2FC = 3.4, <xref ref-type="fig" rid="F3">Figure 3B</xref>). And there was a significant positive correlation between <italic>GATA2</italic> and <italic>BAG3</italic> transcription in B-ALL (<italic>r</italic> = 0.35, <italic>p</italic>-value = 3.09e-18, <xref ref-type="fig" rid="F3">Figure 3C</xref>). Furthermore, GATA2 binding was observed in ChIP-seq experiments from multiple tumor cell lines, namely LNCaP, HUVEC, SHSY5Y, and K562 (<xref ref-type="fig" rid="F3">Figure 3D</xref>). Taken together, these observations support the hypothesis that <italic>BAG3</italic> is a target of aberrantly activated <italic>GATA2</italic> in B-ALL. Similar observations were made for <italic>EPOR</italic> and <italic>KLF1</italic>; both genes showed significant co-expression with <italic>GATA2</italic> (<xref ref-type="fig" rid="F3">Figure 3C</xref>) and positive GATA2 binding observed for multiple cancer cell lines in ChIP-seq experiments (<xref ref-type="fig" rid="F3">Figure 3D</xref>). <italic>EPOR</italic> is a well-established B-ALL-associated gene whose abnormal activation in pre-B cells increases cell survival by activating the JAK-STAT pathway (<xref ref-type="bibr" rid="B37">37</xref>), whereas <italic>KLF1</italic> is associated with poor survival in AML (<xref ref-type="bibr" rid="B38">38</xref>). The up-regulation of these genes by <italic>GATA2</italic> activation may play a tumor-promoting role in leukemia and reinforce the potential function of <italic>GATA2</italic> in leukemogenesis in B-ALL.</p>
<fig id="F3" position="float">
<label>Figure 3</label>
<caption><p>Potential targets of <italic>GATA2</italic> activation. <bold>(A)</bold> The overlap between potential <italic>GATA2</italic>-targeted genes predicted by FIMO (left) and up-regulated DEGs (right). <bold>(B)</bold> Violin plots showing the normalized expression of the potential <italic>GATA2</italic>-targeted genes <italic>BAG3, EPOR</italic>, and <italic>KLF1</italic> in the <italic>GATA2</italic>-outlier and <italic>GATA2</italic>-normal groups. The <italic>p</italic>-value from differential expression analysis is shown above each plot. <bold>(C)</bold> Scatter plots indicating the correlations between normalized expression levels of <italic>GATA2</italic> (x axis) and the potential target genes (y axis). The correlation coefficient and <italic>p</italic>-value were determined by Pearson correlation analysis. <bold>(D)</bold> Wiggle plot of GATA2 ChIP-seq data from four tumor cell lines showing that the GATA2-binding site is located near the potential target genes in <bold>(B)</bold>.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fped-09-795529-g0003.tif"/>
</fig>
</sec>
<sec>
<title>Trans- and Cis-Activation of <italic>GATA2</italic> in B-ALL</title>
<p>In the 13 <italic>GATA2</italic>-outlier B-ALL patients, two were MLL subtype (SJBALL021549_D1 and SJINF066_D). Notably, we found that both patients carried the same <italic>KMT2A-USP2</italic> fusion. Further checking confirmed that these patients were the only two carrying this fusion in the cohort analyzed (<xref ref-type="supplementary-material" rid="SM5">Supplementary Table 1</xref>), indicating that <italic>GATA2</italic> could be trans-activated by KMT2A-USP2. <italic>KMT2A-USP2</italic> is a relatively rare type of <italic>KMT2A</italic> rearrangement and was recently reported as a recurrent fusion in pediatric B-ALL (<xref ref-type="bibr" rid="B39">39</xref>). In the two cases identified in this analysis, the breakpoint of the fusion was located within intron 22 of <italic>KMT2A</italic> (NM_005933) and intron 2 of <italic>USP2</italic> (NM_004205), which resulted in an in-frame fusion consisting of exons 1&#x02013;21 of <italic>KMT2A</italic> and exons 3&#x02013;13 of <italic>USP2</italic> (<xref ref-type="supplementary-material" rid="SM3">Supplementary Figure 3</xref>). The fusion protein contains the entire deubiquitination domain of USP2, indicating that USP2 might be the functional executor of this chimeric protein. Interestingly, wild-type <italic>USP2</italic> was not transcribed in majority of B-ALL patients (<xref ref-type="fig" rid="F4">Figure 4A</xref>) and could be activated through fusion with <italic>KMT2A</italic> (<xref ref-type="fig" rid="F4">Figure 4B</xref>), with active transcription of <italic>USP2</italic> occurring through hijacking of the <italic>KMT2A</italic> promoter (<xref ref-type="supplementary-material" rid="SM1">Supplementary Figure 3</xref>). In addition, we found high levels of wild-type <italic>USP2</italic> transcription in couple of B-ALL patients with other MLL subtype (<xref ref-type="fig" rid="F4">Figures 4A,B</xref>), indicating <italic>USP2</italic> could also be aberrantly activated in <italic>KMT2A</italic> rearranged B-ALL. Notably, <italic>GATA2</italic> outlier expression was found in patients with the <italic>KMT2A-USP2</italic> fusion but not in other <italic>KMT2A</italic> rearranged patients with high expression of wild-type <italic>USP2</italic> (<xref ref-type="fig" rid="F4">Figure 4C</xref>), suggesting that <italic>GATA2</italic> transcription was activated by the chimeric fusion protein as a whole.</p>
<fig id="F4" position="float">
<label>Figure 4</label>
<caption><p>The <italic>KMT2A-USP2</italic> fusion activates <italic>GATA2</italic> in B-ALL. <bold>(A)</bold> The expression of <italic>USP2</italic> in 629 B-ALL patients across 11 subtypes. Six MLL B-ALL patients with <italic>USP2</italic> FPKM values &#x0003E;5 are labeled with the corresponding sample IDs. Two patients with the <italic>KMT2A-USP2</italic> fusion are highlighted in red. <bold>(B)</bold> Boxplot showing <italic>USP2</italic> transcription in patients with the MLL subtype of B-ALL. Cases were further divided into groups according to <italic>KMT2A</italic> fusion partner. Six <italic>USP2</italic>-positive MLL cases are labeled and color coded as in <bold>(A)</bold>. <bold>(C)</bold> The expression of <italic>GATA2</italic> across different fusion partner groups in MLL subtypes as shown in <bold>(B)</bold>.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fped-09-795529-g0004.tif"/>
</fig>
<p>Meanwhile, we were able to identify another MLL B-ALL case, SJALL043839_D1, with aberrant <italic>GATA2</italic> transcription from a previously published ALL cohort (<xref ref-type="bibr" rid="B27">27</xref>), in which both RNA-seq and whole-genome sequencing (WGS) data were available for tumor cells. By integrating WGS and RNA-seq data with cis-X (<xref ref-type="bibr" rid="B28">28</xref>), we found significant allele-specific expression (ASE, <xref ref-type="fig" rid="F5">Figure 5A</xref>) as well as outlier expression of <italic>GATA2</italic> in this case compared with the remaining B-ALL patients from the same cohort (<xref ref-type="fig" rid="F5">Figure 5B</xref>). Further analysis identified a somatically acquired 101 kb focal deletion located 285 kb downstream of the TSS of <italic>GATA2</italic> in the tumor cells (<xref ref-type="fig" rid="F5">Figure 5C</xref>). Notably, <italic>GATA2</italic> was the only cis-activated gene in the genomic neighborhood surrounding this deletion (<xref ref-type="supplementary-material" rid="SM4">Supplementary Figures 4A&#x02013;C</xref>), indicating that <italic>GATA2</italic> was the target. Furthermore, <italic>in-situ</italic> high-through chromosome conformation capture (Hi-C) data for both the B-ALL cell line Nalm6 and neuroblastoma cell line Kelly (<xref ref-type="fig" rid="F5">Figure 5C</xref>) from GenomePaint (<xref ref-type="bibr" rid="B30">30</xref>) showed that the deletion overlapped with the boundary of topologically associating domain (TAD) harboring <italic>GATA2</italic>. Disruption of the TAD structure by the deletion might aberrantly connect the <italic>GATA2</italic> promoter to the active regulatory DNA elements in the adjacent TAD, thus contributing to <italic>GATA2</italic> dysregulation in cis.</p>
<fig id="F5" position="float">
<label>Figure 5</label>
<caption><p>Cis-activation of <italic>GATA2</italic> due to a downstream focal deletion. <bold>(A)</bold> Allelic specific expression of <italic>GATA2</italic> in SJALL043839_D1 was determined by examining the mono-allelic expression of six heterozygous germline/somatic variants, which are labeled above the wiggle plot, with blue and red representing the reference and alternative alleles, respectively. <bold>(B)</bold> Outlier high expression (FPKM on the y axis) of <italic>GATA2</italic> was found in sample SJALL043839_D1 (red dot) from the Shanghai Children&#x00027;s Medical Center ALL cohort. <bold>(C)</bold> Focal deletion activating GATA2 in SJALL043839_D1. Topologically associating domains from Hi-C data of the Nalm6 and Kelly cell lines are displayed on the top; both pictures show a wild-type 3-D genome architecture at the <italic>GATA2</italic> locus. A somatic focal deletion was identified in the tumor cells of SJALL043839_D1; the deletion is shown at the bottom with a wiggle plot showing the coverage from whole-genome sequencing data of tumor and matched remission samples. The deletion is indicated by boxes above the wiggle plot, which represent the copy number variation (CNV, log<sub>2</sub>Ratio = &#x02212;0.75) and the loss of heterozygosity (LOH, segment mean value = 0.32). The focal deletion and the candidate TAD boundary disrupted by the deletion are highlighted in yellow. The whole-genome sequencing and Hi-C data were visualized with GenomePaint (<xref ref-type="bibr" rid="B30">30</xref>) (<ext-link ext-link-type="uri" xlink:href="https://genomepaint.stjude.cloud/">https://genomepaint.stjude.cloud/</ext-link>).</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fped-09-795529-g0005.tif"/>
</fig>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<title>Discussion</title>
<p>The expression of transcription factors is strictly regulated during development, both spatially and temporally. Aberrant activation of transcription factors is one of the most common drivers in ALL (<xref ref-type="bibr" rid="B9">9</xref>, <xref ref-type="bibr" rid="B40">40</xref>). <italic>GATA2</italic> is actively expressed in multipotent progenitors, erythroid precursors, and myeloid precursors, but not in lymphoid precursors or B-ALL (<xref ref-type="bibr" rid="B16">16</xref>, <xref ref-type="bibr" rid="B41">41</xref>). In the present study, we first reported low expression of <italic>GATA2</italic> in the majority of B-ALL patients, which was consistent with the origination of this tumor from the early developmental stage of B lymphoid. On the other hand, we showed that <italic>GATA2</italic> was actively transcribed in a subset of B-ALL patients, especially in those with the ETV subtype (<xref ref-type="fig" rid="F1">Figure 1B</xref>). The transcription of <italic>GATA2</italic> in ETV-subtype B-ALL patients is supported by a recent study carried out with the B-ALL cell lines REH and Nalm6, which belong to the ETV and DUX4 subtypes respectively, suggesting potential association between <italic>GATA2</italic> transcription and gene methylation (<xref ref-type="bibr" rid="B42">42</xref>). In addition, we discovered 13 B-ALL cases with aberrant <italic>GATA2</italic> activation from 629 B-ALL patients, indicating that <italic>GATA2</italic> dysregulation is a shared feature of different B-ALL subtypes. Cluster analysis based on 1150 DEGs between <italic>GATA2</italic>-outlier cases and <italic>GATA2</italic>-normal cases showed that patients could not be grouped by <italic>GATA2</italic> transcription level (<xref ref-type="supplementary-material" rid="SM1">Supplementary Figure 1D</xref>). This was partially because of the limited number of <italic>GATA2</italic> outlier cases included in this analysis, but it also indicated that <italic>GATA2</italic> activation was a secondary event in B-ALL and would need to cooperate with other driver genomic aberrations in leukemogenesis. Further investigations including more B-ALL cases with <italic>GATA2</italic> activation are needed to unveil detailed co-occurrence relationship between <italic>GATA2</italic> activation and other driver genomic aberrations. Meanwhile, the myeloid-specific gene signature observed in these cases indicated that <italic>GATA2</italic> activation rewires gene transcription circuits in B-ALL cells toward myeloid-like (<xref ref-type="fig" rid="F2">Figures 2C,D</xref>), which is consistent with the expression of <italic>GATA2</italic> in early myeloid precursors (<xref ref-type="bibr" rid="B43">43</xref>). On the other hand, it was reported that <italic>GATA2</italic> deficiency restricts cell proliferation in AML cells and delays leukemogenesis in <italic>Cbfb-Myh11</italic> knock-in mice, supporting the notion that <italic>GATA2</italic> is a poor prognostic marker in pediatric AML (<xref ref-type="bibr" rid="B22">22</xref>). Indeed, we found that several up-regulated DEGs targeted by <italic>GATA2</italic> in the <italic>GATA2</italic>-outlier B-ALL cases were known tumor-associated genes (<xref ref-type="fig" rid="F2">Figure 2A</xref>), including <italic>BAG3</italic> and <italic>EPOR</italic>. This provides further evidence for the potential tumor promoting function of <italic>GATA2</italic> in B-ALL.</p>
<p>The two MLL subtype patients (SJBALL021549_D1 and SJINF066_D) with <italic>GATA2</italic> activation both carried the <italic>KMT2A</italic>-<italic>USP2</italic> fusion, which is rare in B-ALL and its function has been largely unexplored. Although patient SJINF066 was an infant (9-month-old) and SJBALL021549_D1 was a 9-year-old child, the expression levels of <italic>GATA2</italic> in these two cases were comparable, indicating that trans-activation of <italic>GATA2</italic> by KMT2A-USP2 is not influenced by age but rather by the function of this fusion. Different from other common <italic>KMT2A</italic> rearrangements with breakpoints located in the major breakpoint cluster region (BCR), the <italic>KMT2A</italic>-<italic>USP2</italic> breakpoint appeared to be inside the minor BCR and joined the plant homeodomain (PHD) domain of KMT2A with the conserved ubiquitin carboxyl-terminal hydrolase (UCH) domain of USP2 (<xref ref-type="bibr" rid="B39">39</xref>). The biological function of <italic>KMT2A-USP2</italic> in ALL is still unclear. Available hypotheses have mainly focused on the function of USP2 including USP2-mediated deubiquitination of KMT2A and cell cycle-related cyclin proteins (<xref ref-type="bibr" rid="B39">39</xref>, <xref ref-type="bibr" rid="B44">44</xref>). However, we noticed that high expression of wild-type <italic>USP2</italic> did not result in aberrant <italic>GATA2</italic> transcription (<xref ref-type="fig" rid="F4">Figure 4C</xref>), indicating that both parts of the KMT2A-USP2 fusion protein contribute to <italic>GATA2</italic> activation. Considering that the <italic>KMT2A</italic> fusion trans-activates <italic>HOX</italic> genes by directly binding to <italic>HOX</italic> loci (<xref ref-type="bibr" rid="B45">45</xref>) and that histone H2A ubiquitination plays a critical function in polycomb-mediated transcriptional repression (<xref ref-type="bibr" rid="B46">46</xref>, <xref ref-type="bibr" rid="B47">47</xref>), it is likely that USP2 is relocated to the nucleus by the KMT2A-USP2 fusion and contributes to trans-activation of <italic>GATA2</italic> transcription through deubiquitinating H2A and further disrupting gene silencing maintained by polycomb group complexes. Further experiments are needed to investigate the molecular mechanism. In a previously published study of a cohort of 11 pediatric B-ALL patients with the <italic>KMT2A-USP2</italic> fusion, three patients presented with central nervous system disease and 8 patients had positive-minimal residual disease at day 33, suggesting a poor prognosis of patients carrying this fusion (<xref ref-type="bibr" rid="B39">39</xref>). Our results identifying <italic>GATA2</italic> as a potentially novel target of the KMT2A-USP2 fusion might provide novel clues for understanding the function of this fusion.</p>
<p>Our data showed that in addition to the trans-activation of <italic>GATA2</italic> by the KMT2A-USP2 fusion, a cis-activating mechanism is also involved in <italic>GATA2</italic> dysregulation. ASE and high outlier expression of <italic>GATA2</italic> were found in one B-ALL patient with a somatic focal deletion detected downstream of <italic>GATA2</italic> (<xref ref-type="fig" rid="F5">Figures 5A,B</xref>). Hi-C data from Nalm6 and Kelly cell lines verified that the candidate insulated boundaries were potentially disrupted by the deletion (<xref ref-type="fig" rid="F5">Figure 5C</xref>). The evidence confirmed that the focal deletion altered the conserved three-dimensional genome structure thus cis-activating <italic>GATA2</italic> in B-ALL. This mechanism is similar to the activation of other oncogenes including <italic>TAL1</italic> and <italic>LMO2</italic> by disruption of TADs (<xref ref-type="bibr" rid="B48">48</xref>). Interestingly, SJALL043839_D1 is also a MLL B-ALL (<italic>KMT2A-MLLT3</italic>). As the <italic>KMT2A</italic> rearrangement was an unfavorable prognostic factor (<xref ref-type="bibr" rid="B5">5</xref>, <xref ref-type="bibr" rid="B6">6</xref>) in ALL, further investigation of the potential interplay of aberrant <italic>GATA2</italic> transcription and <italic>KMT2A</italic> fusions might shed new light on the molecular basis of this subtype of B-ALL.</p>
<p>Taken together, our study revealed aberrant <italic>GATA2</italic> activation in B-ALL patients. Abnormal <italic>GATA2</italic> transcription makes B-ALL tumor cells more myeloid-like and could contribute to leukemogenesis by activating downstream target genes.</p>
</sec>
<sec sec-type="data-availability" id="s5">
<title>Data Availability Statement</title>
<p>The RNA-seq data for the St. Jude leukemia patients (297 AML cases, 99 T-ALL cases, and 1248 B-ALL cases) were downloaded from St. Jude cloud (<ext-link ext-link-type="uri" xlink:href="https://www.stjude.cloud">https://www.stjude.cloud</ext-link>). The GATA2 ChIP-seq data used in this study can be accessed from the gene expression omnibus under accession nos. <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="GSM1600544">GSM1600544</ext-link>, <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="GSM935347">GSM935347</ext-link>, <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="GSM935589">GSM935589</ext-link>, and <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="GSM935373">GSM935373</ext-link> for LNCaP, HUVEC, SHSY5Y, and K562 cells, respectively, with the called peaks (in BED format) available upon request. Whole-genome sequencing and RNA-seq data for SJALL043839_D1 are available in St. Jude Cloud GenomePaint (<ext-link ext-link-type="uri" xlink:href="https://genomepaint.stjude.cloud/">https://genomepaint.stjude.cloud/</ext-link>). The Hi-C data of Nalm6 and Kelly cell lines are also available from St. Jude Cloud GenomePaint.</p>
</sec>
<sec id="s6">
<title>Author Contributions</title>
<p>HW, BC, and HS performed statistical analysis. FZ collected clinical information. JR, RW, and SZ analyzed the genomic data of SJALL043839_D1. SS and YL designed and supervised the study. HW and YL wrote the manuscript. All authors contributed to the article and approved the submitted version.</p>
</sec>
<sec sec-type="funding-information" id="s7">
<title>Funding</title>
<p>This work was supported by the National Natural Science Foundation of China (31970627 to YL) and Shanghai Key Laboratory of Clinical Molecular Diagnostics for Pediatrics (20dz2260900 to YL).</p>
</sec>
<sec sec-type="COI-statement" id="conf1">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s8">
<title>Publisher&#x00027;s Note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
</body>
<back>
<sec sec-type="supplementary-material" id="s9">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fped.2021.795529/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fped.2021.795529/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Image_1.TIF" id="SM1" mimetype="image/tif" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary Figure 1</label>
<caption><p>The effect of <italic>GATA2</italic> activation on differentially expressed genes in B-ALL. <bold>(A)</bold> Intersection between down-regulated DEGs (left) and B cell markers (right). Three out of five B cell markers were down regulated in <italic>GATA2</italic>-outlier cases and listed below. <bold>(B)</bold> A total of 451 down-regulated DEGs were enriched in pre-B or pro-B lymphoid cell-related categories in the ToppCell Atlas. Significantly enriched categories (<italic>p</italic>-value &#x0003C; 10<sup>&#x02212;15</sup>) are shown. <bold>(C)</bold> Gene Ontology enrichment results for 451 down-regulated DEGs; categories are associated with the cell cycle. The categories with a <italic>p</italic>-value &#x0003C; 10<sup>&#x02212;7</sup> are shown and sorted by <italic>p</italic>-value in reverse order. <bold>(D)</bold> Cluster analysis of <italic>GATA2</italic>-outlier (<italic>n</italic> = 13, big circles) and <italic>GATA2</italic>-normal samples (<italic>n</italic> = 571, small circles) using 1150 DEGs from differential expression analysis. The results are shown as a t-SNE plot. Each dot represents an individual B-ALL patient and the color indicates the B-ALL subtype.</p></caption>
</supplementary-material>
<supplementary-material xlink:href="Image_2.TIF" id="SM2" mimetype="image/tif" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary Figure 2</label>
<caption><p>Prediction of <italic>GATA2</italic> targets. <bold>(A)</bold> Distribution of distances between <italic>GATA2</italic> peaks and the nearest TSS of a gene in the GATA2 ChIP-seq from LNCaP (GSE38391). Only peaks within the promoter region (&#x02212;1000 to &#x0002B;1000 bp) of at least one protein coding gene were included. <bold>(B)</bold> The enrichment results of 313 potential GATA-targeted genes. The number of target genes in each enriched category is shown on the x-axis. The color represents the <italic>p</italic>-value. <bold>(C)</bold> Intersection of potential <italic>GATA2</italic> target genes predicted by FIMO (left) and DEGs down-regulated upon <italic>GATA2</italic> activation (right).</p></caption>
</supplementary-material>
<supplementary-material xlink:href="Image_3.TIF" id="SM3" mimetype="image/tif" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary Figure 3</label>
<caption><p><italic>KMT2A-USP2</italic> fusion in MLL B-ALL patients with outlier <italic>GATA2</italic> transcription. Protein diagrams were generated using ProteinPaint (<xref ref-type="bibr" rid="B29">29</xref>) (<ext-link ext-link-type="uri" xlink:href="https://proteinpaint.stjude.org/">https://proteinpaint.stjude.org/</ext-link>).</p></caption>
</supplementary-material>
<supplementary-material xlink:href="Image_4.TIF" id="SM4" mimetype="image/tif" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary Figure 4</label>
<caption><p>The transcription of genes near the deletion downstream of <italic>GATA2</italic>. The expression levels of <italic>EEFSEC</italic> <bold>(A)</bold>, <italic>RUBBL1</italic> <bold>(B)</bold>, and <italic>SEC61A1</italic> <bold>(C)</bold> in B-ALL patients from the Shanghai Children&#x00027;s Medical Center ALL cohort are shown as scatterplots. Expression level (FPKM) is plotted on the y-axis. The case with cis-activated <italic>GATA2</italic> (SJALL043839_D1) is highlighted in red in each panel.</p></caption>
</supplementary-material>
<supplementary-material xlink:href="Data_Sheet_1.xlsx" id="SM5" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kato</surname> <given-names>M</given-names></name> <name><surname>Manabe</surname> <given-names>A</given-names></name></person-group>. <article-title>Treatment and biology of pediatric acute lymphoblastic leukemia</article-title>. <source>Pediatr Int.</source> (<year>2018</year>) <volume>60</volume>:<fpage>4</fpage>&#x02013;<lpage>12</lpage>. <pub-id pub-id-type="doi">10.1111/ped.13457</pub-id><pub-id pub-id-type="pmid">29143423</pub-id></citation></ref>
<ref id="B2">
<label>2.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hunger</surname> <given-names>SP</given-names></name> <name><surname>Mullighan</surname> <given-names>CG</given-names></name></person-group>. <article-title>Acute lymphoblastic leukemia in children</article-title>. <source>N Engl J Med.</source> (<year>2015</year>) <volume>373</volume>:<fpage>1541</fpage>&#x02013;<lpage>52</lpage>. <pub-id pub-id-type="doi">10.1056/NEJMra1400972</pub-id><pub-id pub-id-type="pmid">26465987</pub-id></citation></ref>
<ref id="B3">
<label>3.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Van Vlierberghe</surname> <given-names>P</given-names></name> <name><surname>Ferrando</surname> <given-names>A</given-names></name></person-group>. <article-title>The molecular basis of T cell acute lymphoblastic leukemia</article-title>. <source>J Clin Invest.</source> (<year>2012</year>) <volume>122</volume>:<fpage>3398</fpage>&#x02013;<lpage>406</lpage>. <pub-id pub-id-type="doi">10.1172/JCI61269</pub-id><pub-id pub-id-type="pmid">23023710</pub-id></citation></ref>
<ref id="B4">
<label>4.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Arico</surname> <given-names>M</given-names></name> <name><surname>Valsecchi</surname> <given-names>MG</given-names></name> <name><surname>Camitta</surname> <given-names>B</given-names></name> <name><surname>Schrappe</surname> <given-names>M</given-names></name> <name><surname>Chessells</surname> <given-names>J</given-names></name> <name><surname>Baruchel</surname> <given-names>A</given-names></name> <etal/></person-group>. <article-title>Outcome of treatment in children with Philadelphia chromosome-positive acute lymphoblastic leukemia</article-title>. <source>N Engl J Med.</source> (<year>2000</year>) <volume>342</volume>:<fpage>998</fpage>&#x02013;<lpage>1006</lpage>. <pub-id pub-id-type="doi">10.1056/NEJM200004063421402</pub-id><pub-id pub-id-type="pmid">26457281</pub-id></citation></ref>
<ref id="B5">
<label>5.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pui</surname> <given-names>CH</given-names></name> <name><surname>Carroll</surname> <given-names>WL</given-names></name> <name><surname>Meshinchi</surname> <given-names>S</given-names></name> <name><surname>Arceci</surname> <given-names>RJ</given-names></name></person-group>. <article-title>Biology, risk stratification, and therapy of pediatric acute leukemias: an update</article-title>. <source>J Clin Oncol.</source> (<year>2011</year>) <volume>29</volume>:<fpage>551</fpage>&#x02013;<lpage>65</lpage>. <pub-id pub-id-type="doi">10.1200/JCO.2010.30.7405</pub-id><pub-id pub-id-type="pmid">21220611</pub-id></citation></ref>
<ref id="B6">
<label>6.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Milne</surname> <given-names>TA</given-names></name></person-group>. <article-title>Mouse models of MLL leukemia: recapitulating the human disease</article-title>. <source>Blood.</source> (<year>2017</year>) <volume>129</volume>:<fpage>2217</fpage>&#x02013;<lpage>23</lpage>. <pub-id pub-id-type="doi">10.1182/blood-2016-10-691428</pub-id><pub-id pub-id-type="pmid">28179274</pub-id></citation></ref>
<ref id="B7">
<label>7.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Roberts</surname> <given-names>KG</given-names></name></person-group>. <article-title>Genetics and prognosis of ALL in children vs adults</article-title>. <source>Hematol Am Soc Hematol Educ Program.</source> (<year>2018</year>) <volume>2018</volume>:<fpage>137</fpage>&#x02013;<lpage>45</lpage>. <pub-id pub-id-type="doi">10.1182/asheducation-2018.1.137</pub-id><pub-id pub-id-type="pmid">30504302</pub-id></citation></ref>
<ref id="B8">
<label>8.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Iacobucci</surname> <given-names>I</given-names></name> <name><surname>Mullighan</surname> <given-names>CG</given-names></name></person-group>. <article-title>Genetic basis of acute lymphoblastic leukemia</article-title>. <source>J Clin Oncol.</source> (<year>2017</year>) <volume>35</volume>:<fpage>975</fpage>&#x02013;<lpage>83</lpage>. <pub-id pub-id-type="doi">10.1200/JCO.2016.70.7836</pub-id><pub-id pub-id-type="pmid">28297628</pub-id></citation></ref>
<ref id="B9">
<label>9.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Somasundaram</surname> <given-names>R</given-names></name> <name><surname>Prasad</surname> <given-names>MA</given-names></name> <name><surname>Ungerback</surname> <given-names>J</given-names></name> <name><surname>Sigvardsson</surname> <given-names>M</given-names></name></person-group>. <article-title>Transcription factor networks in B-cell differentiation link development to acute lymphoid leukemia</article-title>. <source>Blood.</source> (<year>2015</year>) <volume>126</volume>:<fpage>144</fpage>&#x02013;<lpage>52</lpage>. <pub-id pub-id-type="doi">10.1182/blood-2014-12-575688</pub-id><pub-id pub-id-type="pmid">25990863</pub-id></citation></ref>
<ref id="B10">
<label>10.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mullighan</surname> <given-names>CG</given-names></name> <name><surname>Goorha</surname> <given-names>S</given-names></name> <name><surname>Radtke</surname> <given-names>I</given-names></name> <name><surname>Miller</surname> <given-names>CB</given-names></name> <name><surname>Coustan-Smith</surname> <given-names>E</given-names></name> <name><surname>Dalton</surname> <given-names>JD</given-names></name> <etal/></person-group>. <article-title>Genome-wide analysis of genetic alterations in acute lymphoblastic leukaemia</article-title>. <source>Nature.</source> (<year>2007</year>) <volume>446</volume>:<fpage>758</fpage>&#x02013;<lpage>64</lpage>. <pub-id pub-id-type="doi">10.1038/nature05690</pub-id><pub-id pub-id-type="pmid">17344859</pub-id></citation></ref>
<ref id="B11">
<label>11.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gu</surname> <given-names>Z</given-names></name> <name><surname>Churchman</surname> <given-names>ML</given-names></name> <name><surname>Roberts</surname> <given-names>KG</given-names></name> <name><surname>Moore</surname> <given-names>I</given-names></name> <name><surname>Zhou</surname> <given-names>X</given-names></name> <name><surname>Nakitandwe</surname> <given-names>J</given-names></name> <etal/></person-group>. <article-title>PAX5-driven subtypes of B-progenitor acute lymphoblastic leukemia</article-title>. <source>Nat Genet.</source> (<year>2019</year>) <volume>51</volume>:<fpage>296</fpage>&#x02013;<lpage>307</lpage>. <pub-id pub-id-type="doi">10.1038/s41588-018-0315-5</pub-id><pub-id pub-id-type="pmid">30643249</pub-id></citation></ref>
<ref id="B12">
<label>12.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mullighan</surname> <given-names>CG</given-names></name> <name><surname>Su</surname> <given-names>X</given-names></name> <name><surname>Zhang</surname> <given-names>J</given-names></name> <name><surname>Radtke</surname> <given-names>I</given-names></name> <name><surname>Phillips</surname> <given-names>LA</given-names></name> <name><surname>Miller</surname> <given-names>CB</given-names></name> <etal/></person-group>. <article-title>Deletion of IKZF1 and prognosis in acute lymphoblastic leukemia</article-title>. <source>N Engl J Med.</source> (<year>2009</year>) <volume>360</volume>:<fpage>470</fpage>&#x02013;<lpage>80</lpage>. <pub-id pub-id-type="doi">10.1056/NEJMoa0808253</pub-id><pub-id pub-id-type="pmid">19129520</pub-id></citation></ref>
<ref id="B13">
<label>13.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Belver</surname> <given-names>L</given-names></name> <name><surname>Ferrando</surname> <given-names>A</given-names></name></person-group>. <article-title>The genetics and mechanisms of T cell acute lymphoblastic leukaemia</article-title>. <source>Nat Rev Cancer.</source> (<year>2016</year>) <volume>16</volume>:<fpage>494</fpage>&#x02013;<lpage>507</lpage>. <pub-id pub-id-type="doi">10.1038/nrc.2016.63</pub-id><pub-id pub-id-type="pmid">27451956</pub-id></citation></ref>
<ref id="B14">
<label>14.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname> <given-names>Y</given-names></name> <name><surname>Easton</surname> <given-names>J</given-names></name> <name><surname>Shao</surname> <given-names>Y</given-names></name> <name><surname>Maciaszek</surname> <given-names>J</given-names></name> <name><surname>Wang</surname> <given-names>Z</given-names></name> <name><surname>Wilkinson</surname> <given-names>MR</given-names></name> <etal/></person-group>. <article-title>The genomic landscape of pediatric and young adult T-lineage acute lymphoblastic leukemia</article-title>. <source>Nat Genet.</source> (<year>2017</year>) <volume>49</volume>:<fpage>1211</fpage>&#x02013;<lpage>8</lpage>. <pub-id pub-id-type="doi">10.1038/ng.3909</pub-id><pub-id pub-id-type="pmid">28671688</pub-id></citation></ref>
<ref id="B15">
<label>15.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Crispino</surname> <given-names>JD</given-names></name> <name><surname>Horwitz</surname> <given-names>MS</given-names></name></person-group>. <article-title>GATA factor mutations in hematologic disease</article-title>. <source>Blood.</source> (<year>2017</year>) <volume>129</volume>:<fpage>2103</fpage>&#x02013;<lpage>10</lpage>. <pub-id pub-id-type="doi">10.1182/blood-2016-09-687889</pub-id><pub-id pub-id-type="pmid">28179280</pub-id></citation></ref>
<ref id="B16">
<label>16.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bresnick</surname> <given-names>EH</given-names></name> <name><surname>Lee</surname> <given-names>HY</given-names></name> <name><surname>Fujiwara</surname> <given-names>T</given-names></name> <name><surname>Johnson</surname> <given-names>KD</given-names></name> <name><surname>Keles</surname> <given-names>S</given-names></name></person-group>. <article-title>GATA switches as developmental drivers</article-title>. <source>J Biol Chem.</source> (<year>2010</year>) <volume>285</volume>:<fpage>31087</fpage>&#x02013;<lpage>93</lpage>. <pub-id pub-id-type="doi">10.1074/jbc.R110.159079</pub-id><pub-id pub-id-type="pmid">20670937</pub-id></citation></ref>
<ref id="B17">
<label>17.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Menendez-Gonzalez</surname> <given-names>JB</given-names></name> <name><surname>Vukovic</surname> <given-names>M</given-names></name> <name><surname>Abdelfattah</surname> <given-names>A</given-names></name> <name><surname>Saleh</surname> <given-names>L</given-names></name> <name><surname>Almotiri</surname> <given-names>A</given-names></name> <name><surname>Thomas</surname> <given-names>LA</given-names></name> <etal/></person-group>. <article-title>Gata2 as a crucial regulator of stem cells in adult hematopoiesis and acute myeloid leukemia</article-title>. <source>Stem Cell Reports.</source> (<year>2019</year>) <volume>13</volume>:<fpage>291</fpage>&#x02013;<lpage>306</lpage>. <pub-id pub-id-type="doi">10.1016/j.stemcr.2019.07.005</pub-id><pub-id pub-id-type="pmid">31378673</pub-id></citation></ref>
<ref id="B18">
<label>18.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Fransecky</surname> <given-names>L</given-names></name> <name><surname>Neumann</surname> <given-names>M</given-names></name> <name><surname>Heesch</surname> <given-names>S</given-names></name> <name><surname>Schlee</surname> <given-names>C</given-names></name> <name><surname>Ortiz-Tanchez</surname> <given-names>J</given-names></name> <name><surname>Heller</surname> <given-names>S</given-names></name> <etal/></person-group>. <article-title>Silencing of GATA3 defines a novel stem cell-like subgroup of ETP-ALL</article-title>. <source>J Hematol Oncol.</source> (<year>2016</year>) <volume>9</volume>:<fpage>95</fpage>. <pub-id pub-id-type="doi">10.1186/s13045-016-0324-8</pub-id><pub-id pub-id-type="pmid">27658391</pub-id></citation></ref>
<ref id="B19">
<label>19.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>J</given-names></name> <name><surname>Ding</surname> <given-names>L</given-names></name> <name><surname>Holmfeldt</surname> <given-names>L</given-names></name> <name><surname>Wu</surname> <given-names>G</given-names></name> <name><surname>Heatley</surname> <given-names>SL</given-names></name> <name><surname>Payne-Turner</surname> <given-names>D</given-names></name> <etal/></person-group>. <article-title>The genetic basis of early T-cell precursor acute lymphoblastic leukaemia</article-title>. <source>Nature.</source> (<year>2012</year>) <volume>481</volume>:<fpage>157</fpage>&#x02013;<lpage>63</lpage>. <pub-id pub-id-type="doi">10.1038/nature10725</pub-id><pub-id pub-id-type="pmid">22237106</pub-id></citation></ref>
<ref id="B20">
<label>20.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gao</surname> <given-names>J</given-names></name> <name><surname>Gentzler</surname> <given-names>RD</given-names></name> <name><surname>Timms</surname> <given-names>AE</given-names></name> <name><surname>Horwitz</surname> <given-names>MS</given-names></name> <name><surname>Frankfurt</surname> <given-names>O</given-names></name> <name><surname>Altman</surname> <given-names>JK</given-names></name> <etal/></person-group>. <article-title>Heritable GATA2 mutations associated with familial AML-MDS: a case report and review of literature</article-title>. <source>J Hematol Oncol.</source> (<year>2014</year>) <volume>7</volume>:<fpage>36</fpage>. <pub-id pub-id-type="doi">10.1186/1756-8722-7-36</pub-id><pub-id pub-id-type="pmid">26715529</pub-id></citation></ref>
<ref id="B21">
<label>21.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Katayama</surname> <given-names>S</given-names></name> <name><surname>Suzuki</surname> <given-names>M</given-names></name> <name><surname>Yamaoka</surname> <given-names>A</given-names></name> <name><surname>Keleku-Lukwete</surname> <given-names>N</given-names></name> <name><surname>Katsuoka</surname> <given-names>F</given-names></name> <name><surname>Otsuki</surname> <given-names>A</given-names></name> <etal/></person-group>. <article-title>GATA2 haploinsufficiency accelerates EVI1-driven leukemogenesis</article-title>. <source>Blood.</source> (<year>2017</year>) <volume>130</volume>:<fpage>908</fpage>&#x02013;<lpage>19</lpage>. <pub-id pub-id-type="doi">10.1182/blood-2016-12-756767</pub-id><pub-id pub-id-type="pmid">28630119</pub-id></citation></ref>
<ref id="B22">
<label>22.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Luesink</surname> <given-names>M</given-names></name> <name><surname>Hollink</surname> <given-names>IH</given-names></name> <name><surname>Van Der Velden</surname> <given-names>VH</given-names></name> <name><surname>Knops</surname> <given-names>RH</given-names></name> <name><surname>Boezeman</surname> <given-names>JB</given-names></name> <name><surname>De Haas</surname> <given-names>V</given-names></name> <etal/></person-group>. <article-title>High GATA2 expression is a poor prognostic marker in pediatric acute myeloid leukemia</article-title>. <source>Blood.</source> (<year>2012</year>) <volume>120</volume>:<fpage>2064</fpage>&#x02013;<lpage>75</lpage>. <pub-id pub-id-type="doi">10.1182/blood-2011-12-397083</pub-id><pub-id pub-id-type="pmid">22786876</pub-id></citation></ref>
<ref id="B23">
<label>23.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>McLeod</surname> <given-names>C</given-names></name> <name><surname>Gout</surname> <given-names>AM</given-names></name> <name><surname>Zhou</surname> <given-names>X</given-names></name> <name><surname>Thrasher</surname> <given-names>A</given-names></name> <name><surname>Rahbarinia</surname> <given-names>D</given-names></name> <name><surname>Brady</surname> <given-names>SW</given-names></name> <etal/></person-group>. <article-title>St. Jude Cloud: a pediatric cancer genomic data-sharing ecosystem</article-title>. <source>Cancer Discov.</source> (<year>2021</year>) <volume>11</volume>:<fpage>1082</fpage>&#x02013;<lpage>99</lpage>. <pub-id pub-id-type="doi">10.1158/2159-8290.CD-20-1230</pub-id><pub-id pub-id-type="pmid">33408242</pub-id></citation></ref>
<ref id="B24">
<label>24.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Love</surname> <given-names>MI</given-names></name> <name><surname>Huber</surname> <given-names>W</given-names></name> <name><surname>Anders</surname> <given-names>S</given-names></name></person-group>. <article-title>Moderated estimation of fold change and dispersion for RNA-seq data with DESeq2</article-title>. <source>Genome Biol.</source> (<year>2014</year>) <volume>15</volume>:<fpage>550</fpage>. <pub-id pub-id-type="doi">10.1186/s13059-014-0550-8</pub-id><pub-id pub-id-type="pmid">25516281</pub-id></citation></ref>
<ref id="B25">
<label>25.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>J</given-names></name> <name><surname>Bardes</surname> <given-names>EE</given-names></name> <name><surname>Aronow</surname> <given-names>BJ</given-names></name> <name><surname>Jegga</surname> <given-names>AG</given-names></name></person-group>. <article-title>ToppGene suite for gene list enrichment analysis and candidate gene prioritization</article-title>. <source>Nucleic Acids Res.</source> (<year>2009</year>) <volume>37</volume>:<fpage>W305</fpage>&#x02013;<lpage>311</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkp427</pub-id><pub-id pub-id-type="pmid">19465376</pub-id></citation></ref>
<ref id="B26">
<label>26.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bailey</surname> <given-names>TL</given-names></name> <name><surname>Boden</surname> <given-names>M</given-names></name> <name><surname>Buske</surname> <given-names>FA</given-names></name> <name><surname>Frith</surname> <given-names>M</given-names></name> <name><surname>Grant</surname> <given-names>CE</given-names></name> <name><surname>Clementi</surname> <given-names>L</given-names></name> <etal/></person-group>. <article-title>MEME SUITE: tools for motif discovery and searching</article-title>. <source>Nucleic Acids Res.</source> (<year>2009</year>) <volume>37</volume>:<fpage>W202</fpage>&#x02013;<lpage>208</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkp335</pub-id><pub-id pub-id-type="pmid">19458158</pub-id></citation></ref>
<ref id="B27">
<label>27.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>B</given-names></name> <name><surname>Brady</surname> <given-names>SW</given-names></name> <name><surname>Ma</surname> <given-names>X</given-names></name> <name><surname>Shen</surname> <given-names>S</given-names></name> <name><surname>Zhang</surname> <given-names>Y</given-names></name> <name><surname>Li</surname> <given-names>Y</given-names></name> <etal/></person-group>. <article-title>Therapy-induced mutations drive the genomic landscape of relapsed acute lymphoblastic leukemia</article-title>. <source>Blood.</source> (<year>2020</year>) <volume>135</volume>:<fpage>41</fpage>&#x02013;<lpage>55</lpage>. <pub-id pub-id-type="doi">10.1182/blood.2019002220</pub-id><pub-id pub-id-type="pmid">31697823</pub-id></citation></ref>
<ref id="B28">
<label>28.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname> <given-names>Y</given-names></name> <name><surname>Li</surname> <given-names>C</given-names></name> <name><surname>Shen</surname> <given-names>S</given-names></name> <name><surname>Chen</surname> <given-names>X</given-names></name> <name><surname>Szlachta</surname> <given-names>K</given-names></name> <name><surname>Edmonson</surname> <given-names>MN</given-names></name> <etal/></person-group>. <article-title>Discovery of regulatory noncoding variants in individual cancer genomes by using cis-X</article-title>. <source>Nat Genet.</source> (<year>2020</year>) <volume>52</volume>:<fpage>811</fpage>&#x02013;<lpage>8</lpage>. <pub-id pub-id-type="doi">10.1038/s41588-020-0659-5</pub-id><pub-id pub-id-type="pmid">32632335</pub-id></citation></ref>
<ref id="B29">
<label>29.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhou</surname> <given-names>X</given-names></name> <name><surname>Edmonson</surname> <given-names>MN</given-names></name> <name><surname>Wilkinson</surname> <given-names>MR</given-names></name> <name><surname>Patel</surname> <given-names>A</given-names></name> <name><surname>Wu</surname> <given-names>G</given-names></name> <name><surname>Liu</surname> <given-names>Y</given-names></name> <etal/></person-group>. <article-title>Exploring genomic alteration in pediatric cancer using ProteinPaint</article-title>. <source>Nat Genet.</source> (<year>2016</year>) <volume>48</volume>:<fpage>4</fpage>&#x02013;<lpage>6</lpage>. <pub-id pub-id-type="doi">10.1038/ng.3466</pub-id><pub-id pub-id-type="pmid">26711108</pub-id></citation></ref>
<ref id="B30">
<label>30.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhou</surname> <given-names>X</given-names></name> <name><surname>Wang</surname> <given-names>J</given-names></name> <name><surname>Patel</surname> <given-names>J</given-names></name> <name><surname>Valentine</surname> <given-names>M</given-names></name> <name><surname>Shao</surname> <given-names>Y</given-names></name> <name><surname>Newman</surname> <given-names>S</given-names></name> <etal/></person-group>. (<year>2021</year>). <article-title>Exploration of coding and non-coding variants in cancer using GenomePaint</article-title>. <source>Cancer Cell 39</source> <fpage>83</fpage>&#x02013;<lpage>95.e84</lpage>. <pub-id pub-id-type="doi">10.1016/j.ccell.2020.12.011</pub-id><pub-id pub-id-type="pmid">33434514</pub-id></citation></ref>
<ref id="B31">
<label>31.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Weiss</surname> <given-names>MJ</given-names></name> <name><surname>Orkin</surname> <given-names>SH</given-names></name></person-group>. <article-title>GATA transcription factors: key regulators of hematopoiesis</article-title>. <source>Exp Hematol.</source> (<year>1995</year>) <volume>23</volume>:<fpage>99</fpage>&#x02013;<lpage>107</lpage>. <pub-id pub-id-type="pmid">7828675</pub-id></citation></ref>
<ref id="B32">
<label>32.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bresnick</surname> <given-names>EH</given-names></name> <name><surname>Martowicz</surname> <given-names>ML</given-names></name> <name><surname>Pal</surname> <given-names>S</given-names></name> <name><surname>Johnson</surname> <given-names>KD</given-names></name></person-group>. <article-title>Developmental control via GATA factor interplay at chromatin domains</article-title>. <source>J Cell Physiol.</source> (<year>2005</year>) <volume>205</volume>:<fpage>1</fpage>&#x02013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1002/jcp.20393</pub-id><pub-id pub-id-type="pmid">15887235</pub-id></citation></ref>
<ref id="B33">
<label>33.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wu</surname> <given-names>D</given-names></name> <name><surname>Sunkel</surname> <given-names>B</given-names></name> <name><surname>Chen</surname> <given-names>Z</given-names></name> <name><surname>Liu</surname> <given-names>X</given-names></name> <name><surname>Ye</surname> <given-names>Z</given-names></name> <name><surname>Li</surname> <given-names>Q</given-names></name> <etal/></person-group>. <article-title>Three-tiered role of the pioneer factor GATA2 in promoting androgen-dependent gene expression in prostate cancer</article-title>. <source>Nucleic Acids Res.</source> (<year>2014</year>) <volume>42</volume>:<fpage>3607</fpage>&#x02013;<lpage>22</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkt1382</pub-id><pub-id pub-id-type="pmid">24423874</pub-id></citation></ref>
<ref id="B34">
<label>34.</label>
<citation citation-type="journal"><person-group person-group-type="author"><collab>Encode Project Consortium</collab></person-group>. <article-title>An integrated encyclopedia of DNA elements in the human genome</article-title>. <source>Nature.</source> (<year>2012</year>) <volume>489</volume>:<fpage>57</fpage>&#x02013;<lpage>74</lpage>. <pub-id pub-id-type="doi">10.1038/nature11247</pub-id><pub-id pub-id-type="pmid">22955616</pub-id></citation></ref>
<ref id="B35">
<label>35.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Davis</surname> <given-names>CA</given-names></name> <name><surname>Hitz</surname> <given-names>BC</given-names></name> <name><surname>Sloan</surname> <given-names>CA</given-names></name> <name><surname>Chan</surname> <given-names>ET</given-names></name> <name><surname>Davidson</surname> <given-names>JM</given-names></name> <name><surname>Gabdank</surname> <given-names>I</given-names></name> <etal/></person-group>. <article-title>The Encyclopedia of DNA elements (ENCODE): data portal update</article-title>. <source>Nucleic Acids Res.</source> (<year>2018</year>) <volume>46</volume>:<fpage>D794</fpage>&#x02013;<lpage>801</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkx1081</pub-id><pub-id pub-id-type="pmid">29126249</pub-id></citation></ref>
<ref id="B36">
<label>36.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rosati</surname> <given-names>A</given-names></name> <name><surname>Basile</surname> <given-names>A</given-names></name> <name><surname>Falco</surname> <given-names>A</given-names></name> <name><surname>D&#x00027;avenia</surname> <given-names>M</given-names></name> <name><surname>Festa</surname> <given-names>M</given-names></name> <name><surname>Graziano</surname> <given-names>V</given-names></name> <etal/></person-group>. <article-title>Role of BAG3 protein in leukemia cell survival and response to therapy</article-title>. <source>Biochim Biophys Acta.</source> (<year>2012</year>) <volume>1826</volume>:<fpage>365</fpage>&#x02013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1016/j.bbcan.2012.06.001</pub-id><pub-id pub-id-type="pmid">22710027</pub-id></citation></ref>
<ref id="B37">
<label>37.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Torrano</surname> <given-names>V</given-names></name> <name><surname>Procter</surname> <given-names>J</given-names></name> <name><surname>Cardus</surname> <given-names>P</given-names></name> <name><surname>Greaves</surname> <given-names>M</given-names></name> <name><surname>Ford</surname> <given-names>AM</given-names></name></person-group>. <article-title>ETV6-RUNX1 promotes survival of early B lineage progenitor cells via a dysregulated erythropoietin receptor</article-title>. <source>Blood.</source> (<year>2011</year>) <volume>118</volume>:<fpage>4910</fpage>&#x02013;<lpage>8</lpage>. <pub-id pub-id-type="doi">10.1182/blood-2011-05-354266</pub-id><pub-id pub-id-type="pmid">21900195</pub-id></citation></ref>
<ref id="B38">
<label>38.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mansoor</surname> <given-names>A</given-names></name> <name><surname>Mansoor</surname> <given-names>MO</given-names></name> <name><surname>Patel</surname> <given-names>JL</given-names></name> <name><surname>Zhao</surname> <given-names>S</given-names></name> <name><surname>Natkunam</surname> <given-names>Y</given-names></name> <name><surname>Bieker</surname> <given-names>JJ</given-names></name></person-group>. <article-title>KLF1/EKLF expression in acute leukemia is correlated with chromosomal abnormalities</article-title>. <source>Blood Cells Mol Dis.</source> (<year>2020</year>) <volume>83</volume>:<fpage>102434</fpage>. <pub-id pub-id-type="doi">10.1016/j.bcmd.2020.102434</pub-id><pub-id pub-id-type="pmid">32311573</pub-id></citation></ref>
<ref id="B39">
<label>39.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Meyer</surname> <given-names>C</given-names></name> <name><surname>Lopes</surname> <given-names>BA</given-names></name> <name><surname>Caye-Eude</surname> <given-names>A</given-names></name> <name><surname>Cave</surname> <given-names>H</given-names></name> <name><surname>Arfeuille</surname> <given-names>C</given-names></name> <name><surname>Cuccuini</surname> <given-names>W</given-names></name> <etal/></person-group>. <article-title>Human MLL/KMT2A gene exhibits a second breakpoint cluster region for recurrent MLL-USP2 fusions</article-title>. <source>Leukemia.</source> (<year>2019</year>) <volume>33</volume>:<fpage>2306</fpage>&#x02013;<lpage>40</lpage>. <pub-id pub-id-type="doi">10.1038/s41375-019-0451-7</pub-id><pub-id pub-id-type="pmid">30899083</pub-id></citation></ref>
<ref id="B40">
<label>40.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Girardi</surname> <given-names>T</given-names></name> <name><surname>Vicente</surname> <given-names>C</given-names></name> <name><surname>Cools</surname> <given-names>J</given-names></name> <name><surname>De Keersmaecker</surname> <given-names>K</given-names></name></person-group>. <article-title>The genetics and molecular biology of T-ALL</article-title>. <source>Blood.</source> (<year>2017</year>) <volume>129</volume>:<fpage>1113</fpage>&#x02013;<lpage>23</lpage>. <pub-id pub-id-type="doi">10.1182/blood-2016-10-706465</pub-id><pub-id pub-id-type="pmid">28115373</pub-id></citation></ref>
<ref id="B41">
<label>41.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Leonard</surname> <given-names>M</given-names></name> <name><surname>Brice</surname> <given-names>M</given-names></name> <name><surname>Engel</surname> <given-names>JD</given-names></name> <name><surname>Papayannopoulou</surname> <given-names>T</given-names></name></person-group>. <article-title>Dynamics of GATA transcription factor expression during erythroid differentiation</article-title>. <source>Blood.</source> (<year>1993</year>) <volume>82</volume>:<fpage>1071</fpage>&#x02013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1182/blood.V82.4.1071.1071</pub-id><pub-id pub-id-type="pmid">8353273</pub-id></citation></ref>
<ref id="B42">
<label>42.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gaine</surname> <given-names>ME</given-names></name> <name><surname>Sharpe</surname> <given-names>DJ</given-names></name> <name><surname>Smith</surname> <given-names>JS</given-names></name> <name><surname>Colyer</surname> <given-names>HA</given-names></name> <name><surname>Hodges</surname> <given-names>VM</given-names></name> <name><surname>Lappin</surname> <given-names>TR</given-names></name> <etal/></person-group>. <article-title>GATA2 regulates the erythropoietin receptor in t(12;21) ALL</article-title>. <source>Oncotarget.</source> (<year>2017</year>) <volume>8</volume>:<fpage>66061</fpage>&#x02013;<lpage>74</lpage>. <pub-id pub-id-type="doi">10.18632/oncotarget.19792</pub-id><pub-id pub-id-type="pmid">29029492</pub-id></citation></ref>
<ref id="B43">
<label>43.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Grass</surname> <given-names>JA</given-names></name> <name><surname>Boyer</surname> <given-names>ME</given-names></name> <name><surname>Pal</surname> <given-names>S</given-names></name> <name><surname>Wu</surname> <given-names>J</given-names></name> <name><surname>Weiss</surname> <given-names>MJ</given-names></name> <name><surname>Bresnick</surname> <given-names>EH</given-names></name></person-group>. <article-title>GATA-1-dependent transcriptional repression of GATA-2 via disruption of positive autoregulation and domain-wide chromatin remodeling</article-title>. <source>Proc Natl Acad Sci U S A.</source> (<year>2003</year>) <volume>100</volume>:<fpage>8811</fpage>&#x02013;<lpage>6</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1432147100</pub-id><pub-id pub-id-type="pmid">12857954</pub-id></citation></ref>
<ref id="B44">
<label>44.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ikeda</surname> <given-names>J</given-names></name> <name><surname>Shiba</surname> <given-names>N</given-names></name> <name><surname>Tsujimoto</surname> <given-names>SI</given-names></name> <name><surname>Yoshida</surname> <given-names>M</given-names></name> <name><surname>Nakabayashi</surname> <given-names>K</given-names></name> <name><surname>Ogata-Kawata</surname> <given-names>H</given-names></name> <etal/></person-group>. <article-title>Whole transcriptome sequencing reveals a KMT2A-USP2 fusion in infant acute myeloid leukemia</article-title>. <source>Genes Chromosomes Cancer.</source> (<year>2019</year>) <volume>58</volume>:<fpage>669</fpage>&#x02013;<lpage>72</lpage>. <pub-id pub-id-type="doi">10.1002/gcc.22751</pub-id><pub-id pub-id-type="pmid">30869817</pub-id></citation></ref>
<ref id="B45">
<label>45.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Krivtsov</surname> <given-names>AV</given-names></name> <name><surname>Armstrong</surname> <given-names>SA</given-names></name></person-group>. <article-title>MLL translocations, histone modifications and leukaemia stem-cell development</article-title>. <source>Nat Rev Cancer.</source> (<year>2007</year>) <volume>7</volume>:<fpage>823</fpage>&#x02013;<lpage>33</lpage>. <pub-id pub-id-type="doi">10.1038/nrc2253</pub-id><pub-id pub-id-type="pmid">17957188</pub-id></citation></ref>
<ref id="B46">
<label>46.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhou</surname> <given-names>W</given-names></name> <name><surname>Zhu</surname> <given-names>P</given-names></name> <name><surname>Wang</surname> <given-names>J</given-names></name> <name><surname>Pascual</surname> <given-names>G</given-names></name> <name><surname>Ohgi</surname> <given-names>KA</given-names></name> <name><surname>Lozach</surname> <given-names>J</given-names></name> <etal/></person-group>. <article-title>Histone H2A monoubiquitination represses transcription by inhibiting RNA polymerase II transcriptional elongation</article-title>. <source>Mol Cell.</source> (<year>2008</year>) <volume>29</volume>:<fpage>69</fpage>&#x02013;<lpage>80</lpage>. <pub-id pub-id-type="doi">10.1016/j.molcel.2007.11.002</pub-id><pub-id pub-id-type="pmid">18206970</pub-id></citation></ref>
<ref id="B47">
<label>47.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tamburri</surname> <given-names>S</given-names></name> <name><surname>Lavarone</surname> <given-names>E</given-names></name> <name><surname>Fernandez-Perez</surname> <given-names>D</given-names></name> <name><surname>Conway</surname> <given-names>E</given-names></name> <name><surname>Zanotti</surname> <given-names>M</given-names></name> <name><surname>Manganaro</surname> <given-names>D</given-names></name> <etal/></person-group>. <article-title>Histone H2AK119 mono-ubiquitination is essential for polycomb-mediated transcriptional repression</article-title>. <source>Mol Cell.</source> (<year>2020</year>) <volume>77</volume>:<fpage>840</fpage>&#x02013;<lpage>56</lpage>.e845. <pub-id pub-id-type="doi">10.1016/j.molcel.2019.11.021</pub-id><pub-id pub-id-type="pmid">31883952</pub-id></citation></ref>
<ref id="B48">
<label>48.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hnisz</surname> <given-names>D</given-names></name> <name><surname>Weintraub</surname> <given-names>AS</given-names></name> <name><surname>Day</surname> <given-names>DS</given-names></name> <name><surname>Valton</surname> <given-names>AL</given-names></name> <name><surname>Bak</surname> <given-names>RO</given-names></name> <name><surname>Li</surname> <given-names>CH</given-names></name> <etal/></person-group>. <article-title>Activation of proto-oncogenes by disruption of chromosome neighborhoods</article-title>. <source>Science.</source> (<year>2016</year>) <volume>351</volume>:<fpage>1454</fpage>&#x02013;<lpage>8</lpage>. <pub-id pub-id-type="doi">10.1126/science.aad9024</pub-id><pub-id pub-id-type="pmid">26940867</pub-id></citation></ref>
</ref-list> 
</back>
</article>