<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Neurosci.</journal-id>
<journal-title>Frontiers in Neuroscience</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Neurosci.</abbrev-journal-title>
<issn pub-type="epub">1662-453X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fnins.2022.841145</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Neuroscience</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Identification of cortical interneuron cell markers in mouse embryos based on machine learning analysis of single-cell transcriptomics</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Li</surname> <given-names>Zhandong</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn002"><sup>&#x2020;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/928572/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Wang</surname> <given-names>Deling</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="author-notes" rid="fn002"><sup>&#x2020;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1681391/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Guo</surname> <given-names>Wei</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="author-notes" rid="fn002"><sup>&#x2020;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/844845/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Zhang</surname> <given-names>Shiqi</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/866888/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Chen</surname> <given-names>Lei</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/576896/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Zhang</surname> <given-names>Yu-Hang</given-names></name>
<xref ref-type="aff" rid="aff6"><sup>6</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/326927/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Lu</surname> <given-names>Lin</given-names></name>
<xref ref-type="aff" rid="aff7"><sup>7</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/903563/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Pan</surname> <given-names>XiaoYong</given-names></name>
<xref ref-type="aff" rid="aff8"><sup>8</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/857914/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Huang</surname> <given-names>Tao</given-names></name>
<xref ref-type="aff" rid="aff9"><sup>9</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/552766/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Cai</surname> <given-names>Yu-Dong</given-names></name>
<xref ref-type="aff" rid="aff10"><sup>10</sup></xref>
<xref ref-type="corresp" rid="c002"><sup>&#x002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/103860/overview"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>College of Biological and Food Engineering, Jilin Engineering Normal University</institution>, <addr-line>Changchun</addr-line>, <country>China</country></aff>
<aff id="aff2"><sup>2</sup><institution>State Key Laboratory of Oncology in South China, Department of Radiology, Collaborative Innovation Center for Cancer Medicine, Sun Yat-sen University Cancer Center</institution>, <addr-line>Guangzhou</addr-line>, <country>China</country></aff>
<aff id="aff3"><sup>3</sup><institution>Key Laboratory of Stem Cell Biology, Shanghai Jiao Tong University School of Medicine, Shanghai Institutes for Biological Sciences, Chinese Academy of Sciences</institution>, <addr-line>Shanghai</addr-line>, <country>China</country></aff>
<aff id="aff4"><sup>4</sup><institution>Department of Biostatistics, University of Copenhagen</institution>, <addr-line>Copenhagen</addr-line>, <country>Denmark</country></aff>
<aff id="aff5"><sup>5</sup><institution>College of Information Engineering, Shanghai Maritime University</institution>, <addr-line>Shanghai</addr-line>, <country>China</country></aff>
<aff id="aff6"><sup>6</sup><institution>Channing Division of Network Medicine, Harvard Medical School, Brigham and Women&#x2019;s Hospital</institution>, <addr-line>Boston, MA</addr-line>, <country>United States</country></aff>
<aff id="aff7"><sup>7</sup><institution>Department of Radiology, Columbia University Irving Medical Center</institution>, <addr-line>New York, NY</addr-line>, <country>United States</country></aff>
<aff id="aff8"><sup>8</sup><institution>Key Laboratory of System Control and Information Processing, Ministry of Education of China, Institute of Image Processing and Pattern Recognition, Shanghai Jiao Tong University</institution>, <addr-line>Shanghai</addr-line>, <country>China</country></aff>
<aff id="aff9"><sup>9</sup><institution>CAS Key Laboratory of Tissue Microenvironment and Tumor, Shanghai Institute of Nutrition and Health, University of Chinese Academy of Sciences, Chinese Academy of Sciences</institution>, <addr-line>Shanghai</addr-line>, <country>China</country></aff>
<aff id="aff10"><sup>10</sup><institution>School of Life Sciences, Shanghai University</institution>, <addr-line>Shanghai</addr-line>, <country>China</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Anthony LaMantia, Virginia Tech, United States</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Daniel Meechan, Virginia Tech, United States; Nizhuan Wang, ShanghaiTech University, China</p></fn>
<corresp id="c001">&#x002A;Correspondence: Tao Huang, <email>tohuangtao@126.com</email></corresp>
<corresp id="c002">Yu-Dong Cai, <email>cai_yud@126.com</email></corresp>
<fn fn-type="equal" id="fn002"><p><sup>&#x2020;</sup>These authors have contributed equally to this work</p></fn>
<fn fn-type="other" id="fn004"><p>This article was submitted to Neurodevelopment, a section of the journal Frontiers in Neuroscience</p></fn>
</author-notes>
<pub-date pub-type="epub">
<day>15</day>
<month>07</month>
<year>2022</year>
</pub-date>
<pub-date pub-type="collection">
<year>2022</year>
</pub-date>
<volume>16</volume>
<elocation-id>841145</elocation-id>
<history>
<date date-type="received">
<day>24</day>
<month>12</month>
<year>2021</year>
</date>
<date date-type="accepted">
<day>28</day>
<month>06</month>
<year>2022</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2022 Li, Wang, Guo, Zhang, Chen, Zhang, Lu, Pan, Huang and Cai.</copyright-statement>
<copyright-year>2022</copyright-year>
<copyright-holder>Li, Wang, Guo, Zhang, Chen, Zhang, Lu, Pan, Huang and Cai</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<p>Mammalian cortical interneurons (CINs) could be classified into more than two dozen cell types that possess diverse electrophysiological and molecular characteristics, and participate in various essential biological processes in the human neural system. However, the mechanism to generate diversity in CINs remains controversial. This study aims to predict CIN diversity in mouse embryo by using single-cell transcriptomics and the machine learning methods. Data of 2,669 single-cell transcriptome sequencing results are employed. The 2,669 cells are classified into three categories, caudal ganglionic eminence (CGE) cells, dorsal medial ganglionic eminence (dMGE) cells, and ventral medial ganglionic eminence (vMGE) cells, corresponding to the three regions in the mouse subpallium where the cells are collected. Such transcriptomic profiles were first analyzed by the minimum redundancy and maximum relevance method. A feature list was obtained, which was further fed into the incremental feature selection, incorporating two classification algorithms (random forest and repeated incremental pruning to produce error reduction), to extract key genes and construct powerful classifiers and classification rules. The optimal classifier could achieve an MCC of 0.725, and category-specified prediction accuracies of 0.958, 0.760, and 0.737 for the CGE, dMGE, and vMGE cells, respectively. The related genes and rules may provide helpful information for deepening the understanding of CIN diversity.</p>
</abstract>
<kwd-group>
<kwd>cortical interneuron diversity</kwd>
<kwd>ganglionic eminences</kwd>
<kwd>machine learning</kwd>
<kwd>rule learning</kwd>
<kwd>embryo</kwd>
</kwd-group>
<counts>
<fig-count count="5"/>
<table-count count="3"/>
<equation-count count="1"/>
<ref-count count="55"/>
<page-count count="11"/>
<word-count count="7644"/>
</counts>
</article-meta>
</front>
<body>
<sec id="S1" sec-type="intro">
<title>Introduction</title>
<p>Cortical interneurons (CIN) are a group of cells in the human cerebral cortex, which participate in multiple essential biological processes in the human neural system, such as learning (<xref ref-type="bibr" rid="B41">Pi et al., 2013</xref>), vision (<xref ref-type="bibr" rid="B40">Pfeffer et al., 2013</xref>), and decision making (<xref ref-type="bibr" rid="B46">Wang, 2002</xref>). The cerebral cortex of human beings has more than dozen of CIN subgroups, such as multiple kinds of GABAergic interneurons (<xref ref-type="bibr" rid="B20">Kelsom and Lu, 2013</xref>). However, for a long time, the biological functions of how CINs are mediated by abundant, diverse cell subgroups has not been well known.</p>
<p>To investigate the complexity of CIN subgroups, the origins of CIN are clearly and reliably revealed, and how they differentiate into different cell subgroups is a premise. Early in 2002, researchers already revealed that most GABAergic interneurons are generated from embryonic forebrain in the cortical subventricular zone and further immigrate to other regions of the brain (<xref ref-type="bibr" rid="B15">Gelman and Mar&#x00ED;n, 2010</xref>). In adult human brains, the CINs originate from three regions, namely, caudal ganglionic eminence (CGE), dorsal medial ganglionic eminence (dMGE), and ventral medial ganglionic eminence (vMGE), with specific cellular components and biological functions (<xref ref-type="bibr" rid="B47">Wonders and Anderson, 2006</xref>; <xref ref-type="bibr" rid="B20">Kelsom and Lu, 2013</xref>). Although a rough picture about the formation of diverse CINs is emerging, how and when progenitors develop into multiple subgroups of CINs remain controversial. Two major CIN models have been made to interpret the timeline and biological procedures for the generation of CIN diversity (<xref ref-type="bibr" rid="B47">Wonders and Anderson, 2006</xref>):</p>
<p>Model 1: The diversity of CIN is invoked in the original region before they migrate.</p>
<p>Model 2: The diversity of CIN is regulated after the migration and by the local environment of each region.</p>
<p>To test and validate these two hypotheses, one effective approach could be to investigate the transcriptomic profiling at single cell level during embryo development (<xref ref-type="bibr" rid="B34">Mi et al., 2018</xref>). Recently, <xref ref-type="bibr" rid="B34">Mi et al. (2018)</xref> sequenced the transcriptome for cells collected from the three regions of origin of CIN (CGE, dMGE, and vMGE) in the mouse subpallium across two time points (embryonic days 12.5 and 14.5) and then explored the transcriptomic characteristics of the cells.</p>
<p>In this study, as inspired by <xref ref-type="bibr" rid="B34">Mi et al.&#x2019;s (2018)</xref> work, a more sophisticated bioinformatic analysis on the transcriptomic profiling of CIN cells is conducted by using the same data. Our hypothesis is that if cell types (CGE, dMGE, and vMGE cells) in the regions of origin could be predicted by their transcriptomic profiles, then &#x201C;The diversity of CIN is invoked in the original region&#x201D; (Model 1); otherwise, &#x201C;The diversity of CIN is regulated after the migration&#x201D; (Model 2). Our analysis consists of a series of machine learning algorithms, including the minimum redundancy and maximum relevance (mRMR) (<xref ref-type="bibr" rid="B39">Peng et al., 2005</xref>), the incremental feature selection (IFS) approach (<xref ref-type="bibr" rid="B29">Liu and Setiono, 1998</xref>), random forest (RF) (<xref ref-type="bibr" rid="B4">Breiman, 2001</xref>), and repeated incremental pruning to produce error reduction (RIPPER) (<xref ref-type="bibr" rid="B7">Cohen, 1995</xref>). After the analysis, several myoblast-associated genes (e.g., Lhx8, Calm1, Hmgb1, Meis2, Nr2f2, Basp1, BTAC, ZIC1, NR2F1, and RPS29) were identified and well interpreted via existing literature, and 23 quantitative rules were established to quantify the distribution of identified genes within the regions of origin.</p>
</sec>
<sec id="S2" sec-type="materials|methods">
<title>Materials and methods</title>
<sec id="S2.SS1">
<title>Study design</title>
<p>Our study consisted of five parts, namely, (1) data collection, (2) feature representation, (3) feature ranking, (4) IFS and model building, and (5) top feature interpretation, as shown in <xref ref-type="fig" rid="F1">Figure 1</xref>. More details are presented in the following sections.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption><p>Overall workflow of the study.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fnins-16-841145-g001.tif"/>
</fig>
</sec>
<sec id="S2.SS2">
<title>Dataset</title>
<p>The dataset consisted of 2,669 single cells downloaded from Gene Expression Omnibus (GEO) under the accession number of <ext-link ext-link-type="DDBJ/EMBL/GenBank" xlink:href="GSE109796">GSE109796</ext-link> (<xref ref-type="bibr" rid="B34">Mi et al., 2018</xref>), which contained RNA sequencing reports of 2,669 single cells acquired from tissues dissected from the subpallium of mouse embryos. The 2,669 single cells were divided into three cell types according to their regions of origin in the subpallium, namely, CGE cells, dMGE cells, and vMGE cells, whose numbers were 856, 957, and 856, respectively.</p>
</sec>
<sec id="S2.SS3">
<title>Feature representation</title>
<p>In the downloaded data, RNA sequencing for each cell was recorded by 37,310 reads per kilobase per million mapped reads (RPKM) values. The RPKM values of 6,037 transcripts showed zeros in all cells; thus, they were removed. Finally, each sample (each cell) was represented as a numeric vector of 31,273 RPKM values (37,310-6,037 = 31,273) and used as input in the following computational analysis.</p>
</sec>
<sec id="S2.SS4">
<title>Feature ranking</title>
<p>As mentioned in section &#x201C;Feature representation,&#x201D; lots of features were used to represent each cell sample. Clearly, not all features were related to the classification of cell types. A feature analysis procedure was necessary. In our study, the mRMR method (<xref ref-type="bibr" rid="B39">Peng et al., 2005</xref>) was employed for completing this task. mRMR is a filter-based feature analysis algorithm that could retain feature relevance to classification labels while reducing redundance among features, that is, maximizing the correlation between features and labels while minimizing the correlation between features themselves. However, such purpose is difficult to achieve because the problem is NP-hard. Thus, mRMR gives a heuristic scheme, which sorts feature in a list, named mRMR feature list. At the beginning, this list is empty. The mRMR method selects one feature, which has highest relevance to classification labels and lowest redundance to already-selected features, and appends such feature to the list in each round. This procedure stops until all features are in the list. Evidently, features with the top ranks in the list had the most relevance to classification labels and less correlation to the rest of the other features. Thus, they can comprise a compact feature subspace to represent samples.</p>
<p>This study adopted the mRMR program reported in <ext-link ext-link-type="uri" xlink:href="http://home.penglab.com/proj/mRMR/">http://home.penglab.com/proj/mRMR/</ext-link>. It was performed with its default parameters.</p>
</sec>
<sec id="S2.SS5">
<title>Feature selection and model building</title>
<p>As mRMR method only sorts features in the mRMR list. Which features are important and can be picked up for constructing classifiers is still a problem. In view of this, the IFS method (<xref ref-type="bibr" rid="B29">Liu and Setiono, 1998</xref>) followed to analyze this list in this study. It is a feature screening approach to determine the optimal number of features. To perform IFS on the mRMR feature list, a series of feature subsets with a step of 10 features was first generated, that is, the <italic>i</italic>-th feature subset contained the first 10 &#x00D7; <italic>i</italic> features from the mRMR list. For each subset, a classifier was trained based on one classification algorithm and samples consisting of the features from this feature subset. This classifier was further evaluated by 10-fold cross-validation (<xref ref-type="bibr" rid="B25">Kohavi, 1995</xref>; <xref ref-type="bibr" rid="B5">Chen et al., 2017</xref>; <xref ref-type="bibr" rid="B54">Zhou et al., 2020</xref>; <xref ref-type="bibr" rid="B55">Zhu et al., 2021</xref>). Then, the classifier giving the optimal performance can be obtained. This classifier was termed as the optimal classifier, whereas the features used in this classifier were called optimal features.</p>
<p>As mentioned above, a classification algorithm is necessary for IFS method. Here, two widely used machine-learning classification algorithms were adopted for building classifiers in this study, namely, the RF (<xref ref-type="bibr" rid="B4">Breiman, 2001</xref>) and RIPPER (<xref ref-type="bibr" rid="B7">Cohen, 1995</xref>) algorithms. RF is a meta classifier that contains many decision trees, and each tree is grown from a bootstrap set with a randomly selected feature subset. For making a prediction, its output label is determined by aggregating votes from different decision trees. Several differences always exist between different decision trees in the forest. RF usually averages the prediction results of all decision trees to reduce errors and avoid overfitting. Although this slightly increases the bias and loses some interpretability, it improves prediction performance. RF is always quite efficient to construct classifiers and has wide applications in the fields of bioinformatics (<xref ref-type="bibr" rid="B38">Pan et al., 2010</xref>; <xref ref-type="bibr" rid="B19">Jia et al., 2020</xref>; <xref ref-type="bibr" rid="B28">Liang et al., 2020</xref>; <xref ref-type="bibr" rid="B6">Chen et al., 2021</xref>; <xref ref-type="bibr" rid="B48">Zhang et al., 2021c</xref>). In this study, we directly employed the tool &#x201C;RandomForest&#x201D; in Weka (<xref ref-type="bibr" rid="B13">Frank et al., 2004</xref>), which implements the RF. For convenience, default parameters were used, where the number of decision trees is set to 100.</p>
<p>Although the RF classifier can be efficient to classify CIN cells, it cannot give useful clues to uncover differences of CIN cells from different regions. In view of this, we further employed another classification algorithm, RIPPER. In fact, it is a rule-based algorithm that could generate classification rules to predict cells into different region-based groups. In RIPPER, the training set is first separated into the growing set and pruning set. Then, the rule grows, and the prune phase is repeated until no positive samples are left in the growing set. During the process, one rule is generated by greedily adding conditions to the rule. It predicts the classification of new data based on the interpretable classification IF&#x2013;ELSE rules. Although the RIPPER classifier is generally weaker than RF classifier, it has its own merits. For CIN cells investigated in this study, the rules contained in the RIPPER classifier can clearly indicate the patterns of cells in different regions, giving new insights to study CIN cells. Thus, RIPPER has also been applied to analyze some complicated biological or medical systems (<xref ref-type="bibr" rid="B27">Li et al., 2020</xref>; <xref ref-type="bibr" rid="B51">Zhang et al., 2020</xref>, <xref ref-type="bibr" rid="B49">2021a</xref>). Likewise, the tool &#x201C;JRip&#x201D; in Weka (<xref ref-type="bibr" rid="B13">Frank et al., 2004</xref>) was directly used in this study, which implements the above RIPPER. Also, it was executed using default parameters.</p>
</sec>
<sec id="S2.SS6">
<title>Model interpretation</title>
<p>In our study, the interpretation of model consisted of two parts, interpretation on (1) single-gene and (2) combined-gene rules. Single-gene interpretation focused on the optimal genes (i.e., the feature in the sample vector) selected by IFS with RF, whereas interpretation on combined-gene rule focuses on the optimal rules outputted by IFS with RIPPER. Our interpretation was based on comprehensive literature reviewing on previous works.</p>
</sec>
<sec id="S2.SS7">
<title>Performance measurement</title>
<p>Two quantitative metrics were used to indicate the performance of different models, namely, prediction accuracy (ACC) and Matthew correlation coefficients (MCC) (<xref ref-type="bibr" rid="B32">Matthews, 1975</xref>; <xref ref-type="bibr" rid="B16">Gorodkin, 2004</xref>; <xref ref-type="bibr" rid="B52">Zhao et al., 2018</xref>; <xref ref-type="bibr" rid="B37">Pan et al., 2021</xref>; <xref ref-type="bibr" rid="B50">Zhang et al., 2021b</xref>). ACC could directly show the proportion of correctly predicted samples among all samples. However, this measurement is not very correct if the sizes of classes are of great differences. In this case, MCC is more objective. To calculate such measurement, two matrices, say <italic>X</italic> and <italic>Y</italic>, should be constructed first, where <italic>X</italic> denotes the true class of each sample and <italic>Y</italic> represented the predicted class of each sample. Accordingly, MCC can be computed by</p>
<disp-formula id="S2.E1">
<label>(1)</label>
<mml:math id="M1">
<mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>C</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>C</mml:mi>
</mml:mrow>
<mml:mo>=</mml:mo>
<mml:mrow>
<mml:mo>&#x2062;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>c</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>o</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>v</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>X</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>Y</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:msqrt>
<mml:mrow>
<mml:mi>c</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>o</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>v</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>X</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>X</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>c</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>o</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mi>v</mml:mi>
<mml:mo>&#x2062;</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>Y</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>Y</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msqrt>
</mml:mfrac>
</mml:mrow>
</mml:mrow>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where cov(&#x25CF;) stands for the correlation coefficient of two matrices. The return values of ACC and MCC are continuous values with range of 0&#x2013;1 and -1 to 1, respectively. The higher the ACC and MCC values are, the better performance for the classifiers.</p>
<p>In addition, we also employed the individual accuracy to measure the performance of each classifier. For each class, the individual accuracy of this class is defined as the proportion of correctly predicted samples in this class among all samples in this class. Evidently, high individual accuracy indicates the good performance of one classifier on some class.</p>
</sec>
</sec>
<sec id="S3" sec-type="results">
<title>Results</title>
<p>In our study, 2,669 single-cell samples were collected, and each cell was represented as a numeric vector with 31,273 features. Each feature in the sample vector corresponded to the expression of one gene. The 2,669 samples were divided into three categories, CGE cells (856, 32%), dMGE cells (957, 36%), and vMGE cells (856, 32%). The entire analysis procedures are illustrated in <xref ref-type="fig" rid="F1">Figure 1</xref>.</p>
<sec id="S3.SS1">
<title>Results of feature ranking</title>
<p>The dataset containing 31,273 features was first analyzed by the mRMR method. The mRMR feature list was obtained, which is provided in <xref ref-type="supplementary-material" rid="TS1">Supplementary Table 1</xref>. Features with high ranks were essential for distinguishing CIN cells.</p>
</sec>
<sec id="S3.SS2">
<title>Prediction performance</title>
<p>Based on the mRMR feature list, RF and RIPPER were employed to build the classifiers in the approach of IFS.</p>
<p>When RF was selected in the IFS method, we constructed several RF classifiers on different feature subsets. The performance of these classifiers is listed in <xref ref-type="supplementary-material" rid="TS2">Supplementary Table 2</xref>. For an easy observation, an IFS curve was plotted, as shown in <xref ref-type="fig" rid="F2">Figure 2</xref>, where <italic>x</italic>-axis stands for the number of features in the feature subset and <italic>y</italic>-axis stands for the MCC. The highest MCC was 0.725 when top 240 features were used. Accordingly, these 240 features were the optimal features for RF and an optimal RF classifier was constructed with these optimal features. The ACC of this classifier was 0.816, as listed in <xref ref-type="table" rid="T1">Table 1</xref>. The individual accuracies on CIN cells in three regions are shown in <xref ref-type="fig" rid="F3">Figure 3</xref>. Most CGE cells were correctly predicted with individual accuracy higher than 0.950, whereas the other two individual accuracies were not very high. As a whole, this classifier gave good performance. However, this RF classifier used lots of features. It would not be efficient if lots of samples were inputted. In view of this, we enlarged the IFS curve between 10 and 500, as shown in <xref ref-type="fig" rid="F4">Figure 4</xref>. It can be observed that the curve followed a sharp increasing trend when the number of features were small. After that, the curve became stable. When top 120 features were adopted, the MCC reached 0.711, which was a little lower than that yielded by the optimal RF classifier (0.725). As for ACC, it was 0.807 (<xref ref-type="table" rid="T1">Table 1</xref>), also slightly lower than that produced by the optimal RF classifier (0.816). The individual accuracies of this classifier are illustrated in <xref ref-type="fig" rid="F3">Figure 3</xref>. All were a little lower than those of the optimal RF classifier. These results indicated that the RF classifier with top 120 features provided almost equal performance to the optimal RF classifier. However, it involved much less features, indicating higher efficiency. This RF classifier can be an efficient tool to classify CIN cells. Furthermore, the top 120 features were much more important than the following 120 features. It was valuable to investigate their relationships to CIN cells. Furthermore, to further assess such latent tool, it was tested by additional 10-fold cross-validation for ten times. A box plot, as shown in <xref ref-type="fig" rid="F5">Figure 5</xref>, was drawn for obtained ACC and MCC values. Evidently, they were changed in a small range, indicating the stability of the tool.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption><p>The IFS curves of RIPPER and RF. RIPPER can reach the highest MCC of 0.577, whereas RF can reach the highest MCC of 0.725.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fnins-16-841145-g002.tif"/>
</fig>
<table-wrap position="float" id="T1">
<label>TABLE 1</label>
<caption><p>Performance of some key classifiers.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left">Classification algorithm</td>
<td valign="top" align="center">Number of features</td>
<td valign="top" align="center">ACC</td>
<td valign="top" align="center">MCC</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">RIPPER</td>
<td valign="top" align="center">1,650</td>
<td valign="top" align="center">0.718</td>
<td valign="top" align="center">0.577</td>
</tr>
<tr>
<td valign="top" align="left">RF</td>
<td valign="top" align="center">240</td>
<td valign="top" align="center">0.816</td>
<td valign="top" align="center">0.725</td>
</tr>
<tr>
<td valign="top" align="left">RF</td>
<td valign="top" align="center">120</td>
<td valign="top" align="center">0.807</td>
<td valign="top" align="center">0.711</td>
</tr>
</tbody>
</table></table-wrap>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption><p>The Individual accuracies of some key classifier. Two RF classifiers provide almost equal performance and are superior to the RIPPER classifier.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fnins-16-841145-g003.tif"/>
</fig>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption><p>The IFS curve of RF between 10 and 500. The RF classifier with top 120 features yielded a little lower MCC than the classifier with top 240 features, which is the optimal RF classifier.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fnins-16-841145-g004.tif"/>
</fig>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption><p>Box plot to show the performance of RF classifier with top 120 features under 10-fold cross-validation for 10 times. ACC and MCC vary in a small range, indicating the stability of the classifier.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fnins-16-841145-g005.tif"/>
</fig>
<p>Although the above RF classifiers provided satisfied performance, they provided less even no useful clues to uncover differences of CIN cells in different regions because RF is a black-box algorithm. Thus, we also adopted RIPPER in the IFS method. The performance of RIPPER classifiers on all tested feature subsets is provided in <xref ref-type="supplementary-material" rid="TS2">Supplementary Table 2</xref>. An IFS curve was plotted in <xref ref-type="fig" rid="F2">Figure 2</xref> to show their performance. The highest MCC was 0.577 when top 1,650 features were used. Thus, these features were the optimal features for RIPPER and the optimal RIPPER classifier was built based on them. The ACC of this classifier was 0.718, as listed in <xref ref-type="table" rid="T1">Table 1</xref>. Evidently, MCC and ACC were much lower than those of above RF classifiers. As for the individual accuracies, they are illustrated in <xref ref-type="fig" rid="F3">Figure 3</xref>. They were also much lower than those of the above RF classifiers. All these indicated that the optimal RIPPER classifier was much inferior to above two RF classifiers. However, some useful information can be extracted from this RIPPER classifier, which would be listed in section &#x201C;Top feature interpretation.&#x201D; This information was helpful to uncover the difference of CINs cells in different regions.</p>
</sec>
<sec id="S3.SS3">
<title>Top feature interpretation</title>
<p>With the help of IFS and RF, we extracted 120 essential features, which are the first 120 features listed in <xref ref-type="supplementary-material" rid="TS2">Supplementary Table 2</xref>. These features were deemed to play essential roles to distinguish CIN cells in different regions. Their corresponding genes can be essential single-genes to classify CIN cells.</p>
<p>Furthermore, in our study, RIPPER was employed to generate classification rules to reveal how features interacted with one another, thus predicting cell types. The optimal RIPPER classifier used top 1,650 features. Cell samples represented by these features were learnt by RIPPER, resulting in 23 rules, as listed in <xref ref-type="table" rid="T2">Table 2</xref>. 12 rules were for CGE cells, 9 rules were for vMGE cells and the last rule was for dMGE cells. CGE cell rules ranked higher than the two MGE cell rules, which complied with the observation that CGE cells are easier to be distinguished by their transcriptomic characteristics.</p>
<table-wrap position="float" id="T2">
<label>TABLE 2</label>
<caption><p>The 22 classification rules generated by RIPPER for predicting cell types.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left">Index</td>
<td valign="top" align="left">Rule</td>
<td valign="top" align="center">Label</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">1</td>
<td valign="top" align="left">NKX2-1 &#x2264; 3.6524) and (MT-TM &#x2265; 1.4699) and (MEIS2 &#x2265; 0.7558) and (H3F3B &#x2265; 2019.223223)</td>
<td valign="top" align="center">Caudal ganglionic eminence</td>
</tr>
<tr>
<td valign="top" align="left">2</td>
<td valign="top" align="left">(FOXP2 &#x2265; 0.0047) and (NKX2-1 &#x2264; 5.5415) and (TMSB10 &#x2264; 76.7268) and (NR2F1 &#x2265; 25.2511)</td>
<td valign="top" align="center">Caudal ganglionic eminence</td>
</tr>
<tr>
<td valign="top" align="left">3</td>
<td valign="top" align="left">(NKX2-1 &#x2264; 12.9594) and (RPS20 &#x2264; 17.1104) and (SLC7A11 &#x2265; 0.0538) and (PID1 &#x2265; 0.4191) and (LHX8 &#x2264; 0.0839)</td>
<td valign="top" align="center">Caudal ganglionic eminence</td>
</tr>
<tr>
<td valign="top" align="left">4</td>
<td valign="top" align="left">(NR2F2 &#x2265; 0.2374) and (LHX6 &#x2264; 0.3856) and (5730494M16RIK &#x003E; = 14.4383) and (LHX8 &#x2264; 7.0592)</td>
<td valign="top" align="center">Caudal ganglionic eminence</td>
</tr>
<tr>
<td valign="top" align="left">5</td>
<td valign="top" align="left">(FOXP2 &#x2265; 0.1294) and (EPHA5 &#x2265; 25.8453) and (RPS9 &#x2264; 159.5439) and (DCX &#x2265; 49.7284)</td>
<td valign="top" align="center">Caudal ganglionic eminence</td>
</tr>
<tr>
<td valign="top" align="left">6</td>
<td valign="top" align="left">(NR2F2 &#x2265; 2.2717) and (EPHA5 &#x2265; 3.4019) and (LHX8 &#x2264; 0) and (MEIS2 &#x2265; 18.9392) and (NCAPH &#x2264; 2.4094)</td>
<td valign="top" align="center">Caudal ganglionic eminence</td>
</tr>
<tr>
<td valign="top" align="left">7</td>
<td valign="top" align="left">(ENC1 &#x2264; 1.8862) and (NKX2-1 &#x2264; 12.0905) and (STX7 &#x2265; 0.3228) and (CALM1 &#x2264; 546.2493) and (SOX6 &#x2264; 2.8190)</td>
<td valign="top" align="center">Caudal ganglionic eminence</td>
</tr>
<tr>
<td valign="top" align="left">8</td>
<td valign="top" align="left">(GM6180 &#x2265; 36.7994) and (FOXP2 &#x2265; 3.5745) and (GM13340 &#x2265; 34.469118)</td>
<td valign="top" align="center">Caudal ganglionic eminence</td>
</tr>
<tr>
<td valign="top" align="left">9</td>
<td valign="top" align="left">(EPHA5 &#x2265; 0.1196) and (LHX8 &#x2264; 0.1496) and (GM15266 &#x2264; 19.2334) and (GM1821 &#x2264; 89.839694) and (CALM1 &#x2264; 744.1502)</td>
<td valign="top" align="center">Caudal ganglionic eminence</td>
</tr>
<tr>
<td valign="top" align="left">10</td>
<td valign="top" align="left">(BIRC6 &#x2264; 0) and (NKX2-1 &#x2264; 10.7393) and (CRIP2 &#x2265; 400.8077) and (ZFP238 &#x2265; 6.1810) and (GM10039 &#x2265; 12.3788)</td>
<td valign="top" align="center">Caudal ganglionic eminence</td>
</tr>
<tr>
<td valign="top" align="left">11</td>
<td valign="top" align="left">(ARRDC3 &#x2265; 368.6154) and (PTPRS &#x2264; 24.5126) and (ZFP238 &#x2264; 70.9705)</td>
<td valign="top" align="center">Caudal ganglionic eminence</td>
</tr>
<tr>
<td valign="top" align="left">12</td>
<td valign="top" align="left">(ZFP503 &#x2265; 0.1111) and (MAP4K4 &#x2264; 7.0016)</td>
<td valign="top" align="center">Caudal ganglionic eminence</td>
</tr>
<tr>
<td valign="top" align="left">13</td>
<td valign="top" align="left">(LHX8 &#x2265; 1.4487) and (ZIC1 &#x2265; 0.0111)</td>
<td valign="top" align="center">Ventral medial ganglionic eminence</td>
</tr>
<tr>
<td valign="top" align="left">14</td>
<td valign="top" align="left">(LHX8 &#x2265; 0.3736) and (NR2F1 &#x2264; 9.4921) and (ZSWIM5 &#x2264; 0.0334)</td>
<td valign="top" align="center">Ventral medial ganglionic eminence</td>
</tr>
<tr>
<td valign="top" align="left">15</td>
<td valign="top" align="left">(NR2F1 &#x2264; 15.6811) and (CD24A &#x2265; 2.7069) and (BASP1 &#x2264; 66.0865) and (PKIA &#x2264; 1.8492)</td>
<td valign="top" align="center">Ventral medial ganglionic eminence</td>
</tr>
<tr>
<td valign="top" align="left">16</td>
<td valign="top" align="left">(PAK3 &#x2264; 0.7899) and (RPS18 &#x2265; 4.9001) and (PID1 &#x2265; 1.2578)</td>
<td valign="top" align="center">Ventral medial ganglionic eminence</td>
</tr>
<tr>
<td valign="top" align="left">17</td>
<td valign="top" align="left">(YWHAZ &#x2265; 1.8915) and (SEPT11 &#x2264; 7.8189) and (GM13604 &#x2264; 0.2081) and (H2AFV &#x2265; 1305.9678)</td>
<td valign="top" align="center">Ventral medial ganglionic eminence</td>
</tr>
<tr>
<td valign="top" align="left">18</td>
<td valign="top" align="left">(PAK3 &#x2264; 0.0474) and (CFL1 &#x2265; 31.1042) and (GTF2A1 &#x2264; 20.8911) and (LHX6 &#x2264; 5.6025)</td>
<td valign="top" align="center">Ventral medial ganglionic eminence</td>
</tr>
<tr>
<td valign="top" align="left">19</td>
<td valign="top" align="left">(GM15266 &#x2264; 63.0475) and (MT-RNR2 &#x2265; 9387.3828)</td>
<td valign="top" align="center">Ventral medial ganglionic eminence</td>
</tr>
<tr>
<td valign="top" align="left">20</td>
<td valign="top" align="left">(CITED2 &#x2264; 35.2427) and (GM10718 &#x2264; 1.0898) and (2610017I09RIK &#x2264; 2442.7505) and (GSK3B &#x2264; 1.5164)</td>
<td valign="top" align="center">Ventral medial ganglionic eminence</td>
</tr>
<tr>
<td valign="top" align="left">21</td>
<td valign="top" align="left">(UBE2QL1 &#x2265; 1.5601) and (3110003A17RIK &#x2265; 20.2789) and (RTN1 &#x2264; 4.7837)</td>
<td valign="top" align="center">Ventral medial ganglionic eminence</td>
</tr>
<tr>
<td valign="top" align="left">22</td>
<td valign="top" align="left">(GM3511 &#x2265; 22.9860) and (PTMA &#x2265; 2.2359) and (LHX6 &#x2264; 47.9178)</td>
<td valign="top" align="center">Ventral medial ganglionic eminence</td>
</tr>
<tr>
<td valign="top" align="left">23</td>
<td valign="top" align="left">Others</td>
<td valign="top" align="center">Dorsal medial ganglionic eminence</td>
</tr>
</tbody>
</table></table-wrap>
</sec>
</sec>
<sec id="S4" sec-type="discussion">
<title>Discussion</title>
<p>As mentioned above, 120 features for the RF classifier for CIN cell types were filtered out. The transcriptomic level profiling of candidate genes was associated with CIN development. The literature was searched for the top 30 features, and these features were supported by previous studies as potential biomarkers. Considering length restriction, 10 features were selected for detailed discussion, as listed in <xref ref-type="table" rid="T3">Table 3</xref>. A series of quantitative rules was also identified for detailed prediction on CGE, dMGE, and vMGE cells, laying a foundation for further analyses in this field.</p>
<table-wrap position="float" id="T3">
<label>TABLE 3</label>
<caption><p>Details of essential genes.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left">Gene symbol</td>
<td valign="top" align="center">Description</td>
<td valign="top" align="center">Rank in the feature list</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Lhx8</td>
<td valign="top" align="center">LIM homeobox 8</td>
<td valign="top" align="center">2</td>
</tr>
<tr>
<td valign="top" align="left">Calm1</td>
<td valign="top" align="center">Calmodulin 1</td>
<td valign="top" align="center">4</td>
</tr>
<tr>
<td valign="top" align="left">Hmgb1</td>
<td valign="top" align="center">High mobility group box 1</td>
<td valign="top" align="center">9</td>
</tr>
<tr>
<td valign="top" align="left">Meis2</td>
<td valign="top" align="center">Meis homeobox 2</td>
<td valign="top" align="center">12</td>
</tr>
<tr>
<td valign="top" align="left">Nr2f2</td>
<td valign="top" align="center">Nuclear receptor subfamily 2 group F member 2</td>
<td valign="top" align="center">22</td>
</tr>
<tr>
<td valign="top" align="left">Basp1</td>
<td valign="top" align="center">Brain abundant membrane attached signal protein 1</td>
<td valign="top" align="center">7</td>
</tr>
<tr>
<td valign="top" align="left">Actb</td>
<td valign="top" align="center">Actin beta</td>
<td valign="top" align="center">23</td>
</tr>
<tr>
<td valign="top" align="left">Zic1</td>
<td valign="top" align="center">Zic family member 1</td>
<td valign="top" align="center">30</td>
</tr>
<tr>
<td valign="top" align="left">Nr2f1</td>
<td valign="top" align="center">Nuclear receptor subfamily 2 group F member 1</td>
<td valign="top" align="center">15</td>
</tr>
<tr>
<td valign="top" align="left">Rps29</td>
<td valign="top" align="center">Ribosomal protein S29</td>
<td valign="top" align="center">18</td>
</tr>
</tbody>
</table></table-wrap>
<sec id="S4.SS1">
<title>Genes associated with cortical interneurons</title>
<p><bold>Lhx8</bold>, the top predicted candidate, is a member of LIM-class homeobox genes. According to recent publications, Lhx8 contributes to the regulation of neuronal Shh expression in MGE. Such gene has also been identified to prevent Nkx2-1 expression in a subset of pallial interneurons (<xref ref-type="bibr" rid="B12">Flandin et al., 2011</xref>), suggesting that Lhx8 plays an important role in regulating the early born MGE neurons. In addition, Lhx8 has a special function in the development of neurons. Lhx8 is a major source of cholinergic neurons, and <xref ref-type="bibr" rid="B53">Zhao et al. (2003)</xref> proved that Lhx8 is quite essential during cholinergic neurons&#x2019; development in the forebrain. Integrating the literature supports mentioned above, speculating that Lhx8 as one of our candidates has differential profiling patterns in MGE neuron cells and other cells, consistent with our prediction results, is quite reasonable.</p>
<p><bold>Calm1</bold>, another identified CIN-associated gene encodes a kind of calmodulin (CaM), an effective calcium ion sensor and signal transductor. Neuronal migration is associated with our predicted gene, which may further indicate the potential contribution of our predicted genes on the development of the nervous system. <xref ref-type="bibr" rid="B24">Kobayashi et al. (2014)</xref> reported that Calm1 acts as a specific regulator in the tangential and radial migration of mouse neuron cells. Neuronal migration is a key process in the developing and adult brain, and <xref ref-type="bibr" rid="B21">Khodosevich et al. (2009)</xref> indicated that the knockdown of Calm1 affects neuroblast migration to the OB, suggesting that Calm1 can be an important gene in the regulation of neuron development. Integrating the literature supports mentioned above, Calm1 is confirmed to be a CIN-associated gene.</p>
<p>Another identified gene is <bold>Hmgb1</bold>, which is like histones among the most important chromatin proteins. Hmgb1, a novel cytokine-like mediator, is associated with microglial activation (<xref ref-type="bibr" rid="B22">Kim et al., 2006</xref>). According to recent publications (<xref ref-type="bibr" rid="B23">Kim et al., 2011</xref>), Hmgb1 participates in the regulation in danger signaling and cell death control, acting as a ubiquitously expressed non-histone DNA-binding protein. In addition, Hmgb1 plays various roles in different stages of brain development (<xref ref-type="bibr" rid="B42">Ping et al., 2012</xref>). During early brain development, fore brain development including neurite outgrowth is also associated with Hmgb1. During aging, it is associated with injury induced inflammation. Integrating the literature supports mentioned above, Hmgb1 is suggested to be an important feature to classify the different types of CIN, including CGE, dMGE, vMGE. Overall, effective gene Hmgb1 may also have the capacity to distinguish CGE, dMGE, and vMGE cases.</p>
<p><bold>Meis2</bold>, the next predicted gene, is associated with the development of neural crest cells (<xref ref-type="bibr" rid="B30">Machon et al., 2015</xref>). In early brain development processes, Meis2 participates in the positive and negative regulation of feed-back and feed-forward loops (<xref ref-type="bibr" rid="B1">Agoston et al., 2012</xref>). However, Meis can interact with various trophic factor signaling pathways during neuron differentiation (<xref ref-type="bibr" rid="B3">Bouilloux et al., 2015</xref>), suggesting that Meis can be an essential factor in development of neuron cells. Therefore, our predicted gene, Meis, may be identified as a special factor in classifying CGE, dMGE, and vMGE cases.</p>
<p><bold>Nr2f2</bold> is the following predicted gene in our predicted list. Nr2f2, also known as COUP transcription factor 2, participates in development of CIN subtypes (MGE). <xref ref-type="bibr" rid="B18">Hu et al. (2017)</xref> indicated that the expression level of Nr2f2 is associated with time-dependent specification of layer STT and the survival of neuroepithelium during brain development. <xref ref-type="bibr" rid="B14">Fuentealba et al. (2010)</xref> also proved that as a transcription factor, such gene contributes to the cell type specific development and differentiation control, especially for neurons. Integrating the literature supports mentioned above, speculating that Nr2f2 as a predicted gene may be differentially expressed in CGE, dMGE, and vMGE cases is quite reasonable, validating our prediction.</p>
<p>Another screened out biomarker in our optimal candidates is <bold>Basp1</bold>, also known as GAP-23, which is a well-known member from the family of growth-associated proteins and associated with the protein GAP-43 that is shown to regulate neural cell adhesion molecule controlled outgrowth of neurite. In addition to shared biological functions with GAP-43, Basp1 contributes to the regulation of cellular morphology for plasma membrane (<xref ref-type="bibr" rid="B26">Korshunova et al., 2010</xref>). In addition, membrane-binding Basp1 oligomers are associated with the physiological or pathological in-ion channel activity (<xref ref-type="bibr" rid="B36">Ostroumova et al., 2011</xref>). Integrating the literature supports mentioned above, Basp1 is also associated with the development of neuron cells. Overall, Basp1 as another predicted gene can also distinguish such three regions in CINs.</p>
<p>Beta-actin (<bold>Actb</bold>) is the next gene related to classify the neuron cells. Beta-actin is a conserved protein of six different actin isoforms regulating cell motility, structure, and integrity. Elongating growth is regulated by our predicted gene Actb via axon branching and translation (<xref ref-type="bibr" rid="B11">Donnelly et al., 2013</xref>). Beta-actin can affect the development of neuron cell via essential biological processes for brain development. Beta-actin is a kind of microtubule motor protein during dendritic transport. Integrating the reports mentioned above, beta-actin contributes to the development of neuron cells, suggesting that our predicted gene, BTAC, may be identified as a special factor in distinguishing different CIN regions.</p>
<p><bold>Zic1</bold> is a member of the zinc finger of the cerebellum Zic protein family. It is classified as a Zic protein due to the conservation of the five C2H2 zinc fingers, and the correct function of this protein is critical for early development. <xref ref-type="bibr" rid="B10">Dipietrantonio and Dymecki (2009)</xref> proved that Zic1 levels in pontine gray neurons play an important in the development of pontocerebellar circuit. Therefore, Zic1 can influence the development of brain neurons by pontocerebellar circuity. Zic1 can activate and regulate neural crest development and differentiation at transcriptomic level (<xref ref-type="bibr" rid="B35">Milet et al., 2013</xref>; <xref ref-type="bibr" rid="B2">Bae et al., 2014</xref>). ZIC1 may be identified as a special factor in distinguishing CGE, dMGE, and vMGE cases.</p>
<p>The next two predicted genes, <bold>Nr2f1</bold> and <bold>Rps29</bold>, are associated with optic atrophy syndrome (<xref ref-type="bibr" rid="B17">Henning et al., 2016</xref>) and neuronal gene orthopedic protein (<xref ref-type="bibr" rid="B44">Taylor et al., 2012</xref>). Optic atrophy syndrome is a kind of neuronal disease, and orthopedic protein is a protein related to the development of neuron. Overall, these two genes participate in neuron development. Therefore, they can be the factors in classifying CGE, dMGE, and vMGE cases.</p>
</sec>
<sec id="S4.SS2">
<title>Rules associated with cortical interneurons</title>
<p>In addition to such feature analysis, 22 quantitative rules for brain region clustering for CGE, dMGE, and vMGE cells were identified. Some expression tendencies were confirmed and validated by recent publications. For further validation on such quantitative rules and parameters, the GEO database was screened for accurate FPKM screening. The detailed discussion of each quantitative rule is shown below.</p>
<p>The top 11 rules are associated with the identification of CGE cells, involving <bold>Nkx2-1</bold>, <bold>Foxp2</bold>, <bold>Lhx8</bold>, and <bold>Epha5</bold>. A relatively high expression level of FOXP2 (FPKM &#x003E; 0) and EPHA5 (FPKM &#x003E; 3.4), and low expressions of NKX2-1 (FPKM &#x003C; 3.65) and LHX8 (FPKM &#x003C; 0) may indicate such CIN case turns out to be a CGE case. According to the biological functions of such genes, FOXP2 is associated with multiple essential functions in human beings including speech and language phenotypes (<xref ref-type="bibr" rid="B43">Rodenas-Cuadrado et al., 2018</xref>). Epha5 is an effective kinase from the Eph family, which plays important roles in neural development (<xref ref-type="bibr" rid="B9">Das et al., 2016</xref>). Therefore, high expression of these genes can promote the neural development. Our predicted transcription factor NKX2-1 plays a special role in the specification of subsets of cortical, stratal, and pallidal neurons (<xref ref-type="bibr" rid="B31">Magno et al., 2017</xref>). Therefore, detected expression of these genes is regarded an effective quantitative filter for the identification of CGE cells.</p>
<p>The following rules contribute to the identification of vMGE cells. Parameters <bold>Lhx8</bold> and <bold>Pak3</bold> are abnormally expressed as potential biomarkers of such group of cells. As reported, a relatively higher expression level of Lhx8 (FPKM &#x003E; 1.45) and low expression level of PAK3 (FPKM &#x003C; 0.79) may indicate such CIN case turns out to be a vMGE cells.</p>
<p>According to the biological functions of such genes, a feedback loop between Lhx8 and NGF is associated with the cholinergic functions and may participate in learning and memory (<xref ref-type="bibr" rid="B45">Tomioka et al., 2014</xref>). Moreover, PAK3 as a GTPase regulated enzyme has alternative kinase activity with different splicing variants (<xref ref-type="bibr" rid="B8">Combeau et al., 2012</xref>), indicating that PAK3 has a critical function in the development of neuron cells. Therefore, detected expression of these genes is regarded a potential parameter for the distinction of CINs.</p>
<p>For cells not following the expression patterns discussed above, they were predicted as dMGE cells.</p>
</sec>
<sec id="S4.SS3">
<title>Comparison with previously reported cortical interneuron associated biomarkers</title>
<p>Previously, two studies about cortical interneuron associated biomarkers have been presented (<xref ref-type="bibr" rid="B33">Mayer et al., 2018</xref>; <xref ref-type="bibr" rid="B34">Mi et al., 2018</xref>). Various biomarkers identified in this study have also been validated in such two studies. For instance, in <xref ref-type="bibr" rid="B33">Mayer et al.&#x2019;s (2018)</xref> study, four genes, including NKX2-1, NR2F1, NR2F2, and CITED2, were also identified. The specific biomarkers like NKX2-1 and NR2F2 have been identified in both two previously studies. As discussed above, both genes have been validated by recent publications with solid experimental supports. The identification of these biomarkers that have also been reported in similar studies validated the utility of our method. However, other biomarkers, like Calm1 and Epha5, have not been recognized by previous studies, indicating that our study may discover new biomarkers for different subgroups of CINs, and therefore, provide a new perspective into the subgrouping of cortical interneuron.</p>
</sec>
<sec id="S4.SS4">
<title>Limitations of this study</title>
<p>As discussed above, we identified a group of functional genes and specific quantitative rules that contribute to the prediction of CIN cell types. However, there remain certain limitations in our analyses. Firstly, the result may be affected by the cell-type specificity of each gene in the dataset we used. For instance, YWHAZ is specifically expressed in projection neurons, but ribosomal protein subunits may be identified in almost each cell. Therefore, YWHAZ is more likely to be identified as a biomarker in a dataset with a lot of projection neurons. Secondly, the interpretation and discussion on the sub-division groups and related biological functions just provided a probable explanation for the machine learning based sub-classification results according to previously reported publications, which may not necessary be the actual biological mechanisms. Thirdly, we only tried to identify CIN cell subgrouping biomarkers in one dataset. Further validation of our results in matched mouse model will be accomplished in the next step of our analyses.</p>
</sec>
</sec>
<sec id="S5" sec-type="conclusion">
<title>Conclusion</title>
<p>In this study, machine learning algorithms were applied to predict CIN cell types (CGE, dMGE, and vMGE cells) at the regions of origin by using single-cell transcriptome sequence. Our findings revealed that CIN cell types could be successfully distinguished by their transcriptomic characteristics, especially the CGE cell, suggesting that the diversity of CIN is invoked in the original region before they migrate. Furthermore, a group of genes as well as their combined rules that are important for the prediction of CIN types at the regions of origin were identified and interpreted. Our research may not only provide novel biomarkers for CIN associated myoblasts subtyping but also contribute to deepening the understanding of CIN associated biological processes and related mechanisms.</p>
</sec>
<sec id="S6" sec-type="data-availability">
<title>Data Availability Statement</title>
<p>Publicly available datasets were analyzed in this study. This data can be found here: <ext-link ext-link-type="uri" xlink:href="https://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE109796">https://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE109796</ext-link>.</p>
</sec>
<sec id="S7">
<title>Author contributions</title>
<p>TH and Y-DC designed the study. ZL, DW, WG, SZ, LC, and XP performed the experiments. ZL, DW, WG, Y-HZ, and LL analyzed the results. ZL, DW, and WG wrote the manuscript. All authors contributed to the research and reviewed the manuscript.</p>
</sec>
<sec id="conf1" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="pudiscl1" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
</body>
<back>
<sec id="S8" sec-type="funding-information">
<title>Funding</title>
<p>This work was supported by the Strategic Priority Research Program of Chinese Academy of Sciences (XDB38050200, XDA26040304), the National Key R&#x0026;D Program of China (2018YFC0910403), and the Fund of the Key Laboratory of Tissue Microenvironment and Tumor of Chinese Academy of Sciences (202002).</p>
</sec>
<sec id="S9" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fnins.2022.841145/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fnins.2022.841145/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Table_1.XLSX" id="TS1" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary Table 1</label>
<caption><p>Feature list generated by mRMR method.</p></caption>
</supplementary-material>
<supplementary-material xlink:href="Table_2.XLSX" id="TS2" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink">
<label>Supplementary Table 2</label>
<caption><p>Performance of RF and RIPPER classifiers with different top features in the list.</p></caption>
</supplementary-material>
</sec>
<ref-list>
<title>References</title>
<ref id="B1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Agoston</surname> <given-names>Z.</given-names></name> <name><surname>Li</surname> <given-names>N.</given-names></name> <name><surname>Haslinger</surname> <given-names>A.</given-names></name> <name><surname>Wizenmann</surname> <given-names>A.</given-names></name> <name><surname>Schulte</surname> <given-names>D.</given-names></name></person-group> (<year>2012</year>). <article-title>Genetic and physical interaction of Meis2, Pax3 and Pax7 during dorsal midbrain development.</article-title> <source><italic>BMC Dev. Biol.</italic></source> <volume>12</volume>:<issue>10</issue>. <pub-id pub-id-type="doi">10.1186/1471-213X-12-10</pub-id> <pub-id pub-id-type="pmid">22390724</pub-id></citation></ref>
<ref id="B2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bae</surname> <given-names>C. J.</given-names></name> <name><surname>Park</surname> <given-names>B. Y.</given-names></name> <name><surname>Lee</surname> <given-names>Y. H.</given-names></name> <name><surname>Tobias</surname> <given-names>J. W.</given-names></name> <name><surname>Hong</surname> <given-names>C. S.</given-names></name> <name><surname>Saintjeannet</surname> <given-names>J. P.</given-names></name></person-group> (<year>2014</year>). <article-title>Identification of Pax3 and Zic1 targets in the developing neural crest.</article-title> <source><italic>Dev. Biol.</italic></source> <volume>386</volume> <fpage>473</fpage>&#x2013;<lpage>483</lpage>. <pub-id pub-id-type="doi">10.1016/j.ydbio.2013.12.011</pub-id> <pub-id pub-id-type="pmid">24360908</pub-id></citation></ref>
<ref id="B3"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bouilloux</surname> <given-names>F.</given-names></name> <name><surname>Thireau</surname> <given-names>J.</given-names></name> <name><surname>Vent&#x00E9;o</surname> <given-names>S.</given-names></name> <name><surname>Farah</surname> <given-names>C.</given-names></name> <name><surname>Karam</surname> <given-names>S.</given-names></name> <name><surname>Dauvilliers</surname> <given-names>Y.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>Loss of the transcription factor Meis1 prevents sympathetic neurons target-field innervation and increases susceptibility to sudden cardiac death.</article-title> <source><italic>eLife</italic></source> <volume>5</volume>:<issue>e11627</issue>. <pub-id pub-id-type="doi">10.7554/eLife.11627</pub-id> <pub-id pub-id-type="pmid">26857994</pub-id></citation></ref>
<ref id="B4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Breiman</surname> <given-names>L.</given-names></name></person-group> (<year>2001</year>). <article-title>Random forests.</article-title> <source><italic>Mach. Learn.</italic></source> <volume>45</volume> <fpage>5</fpage>&#x2013;<lpage>32</lpage>.</citation></ref>
<ref id="B5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>L.</given-names></name> <name><surname>Wang</surname> <given-names>S.</given-names></name> <name><surname>Zhang</surname> <given-names>Y.-H.</given-names></name> <name><surname>Li</surname> <given-names>J.</given-names></name> <name><surname>Xing</surname> <given-names>Z.-H.</given-names></name> <name><surname>Yang</surname> <given-names>J.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>Identify key sequence features to improve CRISPR sgRNA efficacy.</article-title> <source><italic>IEEE Access</italic></source> <volume>5</volume> <fpage>26582</fpage>&#x2013;<lpage>26590</lpage>.</citation></ref>
<ref id="B6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>W.</given-names></name> <name><surname>Chen</surname> <given-names>L.</given-names></name> <name><surname>Dai</surname> <given-names>Q.</given-names></name></person-group> (<year>2021</year>). <article-title>iMPT-FDNPL: identification of membrane protein types with functional domains and a natural language processing approach.</article-title> <source><italic>Comput. Math. Methods Med.</italic></source> <volume>2021</volume>:<issue>7681497</issue>. <pub-id pub-id-type="doi">10.1155/2021/7681497</pub-id> <pub-id pub-id-type="pmid">34671418</pub-id></citation></ref>
<ref id="B7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cohen</surname> <given-names>W. W.</given-names></name></person-group> (<year>1995</year>). &#x201C;<article-title>Fast Effective Rule Induction</article-title>,&#x201D; in <source><italic>In Proceedings of theTwelfth International Conference on Machine Learning.</italic></source> (<publisher-loc>California</publisher-loc>), <fpage>115</fpage>&#x2013;<lpage>123</lpage>.</citation></ref>
<ref id="B8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Combeau</surname> <given-names>G.</given-names></name> <name><surname>Kreis</surname> <given-names>P.</given-names></name> <name><surname>Domenichini</surname> <given-names>F.</given-names></name> <name><surname>Amar</surname> <given-names>M.</given-names></name> <name><surname>Fossier</surname> <given-names>P.</given-names></name> <name><surname>Rousseau</surname> <given-names>V.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>The p21-activated kinase PAK3 forms heterodimers with PAK1 in brain implementing trans-regulation of PAK3 activity.</article-title> <source><italic>J. Biol. Chem.</italic></source> <volume>287</volume>:<issue>30084</issue>. <pub-id pub-id-type="doi">10.1074/jbc.M112.355073</pub-id> <pub-id pub-id-type="pmid">22815483</pub-id></citation></ref>
<ref id="B9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Das</surname> <given-names>G.</given-names></name> <name><surname>Yu</surname> <given-names>Q.</given-names></name> <name><surname>Hui</surname> <given-names>R.</given-names></name> <name><surname>Reuhl</surname> <given-names>K.</given-names></name> <name><surname>Gale</surname> <given-names>N. W.</given-names></name> <name><surname>Zhou</surname> <given-names>R.</given-names></name></person-group> (<year>2016</year>). <article-title>EphA5 and EphA6: regulation of neuronal and spine morphology.</article-title> <source><italic>Cell Biosci.</italic></source> <volume>6</volume>:<issue>48</issue>. <pub-id pub-id-type="doi">10.1186/s13578-016-0115-5</pub-id> <pub-id pub-id-type="pmid">27489614</pub-id></citation></ref>
<ref id="B10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dipietrantonio</surname> <given-names>H. J.</given-names></name> <name><surname>Dymecki</surname> <given-names>S. M.</given-names></name></person-group> (<year>2009</year>). <article-title>Zic1 levels regulate mossy fiber neuron position and axon laterality choice in the ventral brain stem.</article-title> <source><italic>Neuroscience</italic></source> <volume>162</volume> <fpage>560</fpage>&#x2013;<lpage>573</lpage>. <pub-id pub-id-type="doi">10.1016/j.neuroscience.2009.02.082</pub-id> <pub-id pub-id-type="pmid">19303920</pub-id></citation></ref>
<ref id="B11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Donnelly</surname> <given-names>C. J.</given-names></name> <name><surname>Park</surname> <given-names>M.</given-names></name> <name><surname>Spillane</surname> <given-names>M.</given-names></name> <name><surname>Yoo</surname> <given-names>S.</given-names></name> <name><surname>Pacheco</surname> <given-names>A.</given-names></name> <name><surname>Gomes</surname> <given-names>C.</given-names></name><etal/></person-group> (<year>2013</year>). <article-title>Axonally Synthesized &#x03B2;-Actin and GAP-43 Proteins Support Distinct Modes of Axonal Growth.</article-title> <source><italic>J. Neurosci.</italic></source> <volume>33</volume> <fpage>3311</fpage>&#x2013;<lpage>3322</lpage>. <pub-id pub-id-type="doi">10.1523/JNEUROSCI.1722-12.2013</pub-id> <pub-id pub-id-type="pmid">23426659</pub-id></citation></ref>
<ref id="B12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Flandin</surname> <given-names>P.</given-names></name> <name><surname>Zhao</surname> <given-names>Y.</given-names></name> <name><surname>Vogt</surname> <given-names>D.</given-names></name> <name><surname>Jeong</surname> <given-names>J.</given-names></name> <name><surname>Long</surname> <given-names>J.</given-names></name> <name><surname>Potter</surname> <given-names>G.</given-names></name><etal/></person-group> (<year>2011</year>). <article-title>Lhx6 and Lhx8 Coordinately Induce Neuronal Expression of Shh that Controls the Generation of Interneuron Progenitors.</article-title> <source><italic>Neuron</italic></source> <volume>70</volume> <fpage>939</fpage>&#x2013;<lpage>950</lpage>. <pub-id pub-id-type="doi">10.1016/j.neuron.2011.04.020</pub-id> <pub-id pub-id-type="pmid">21658586</pub-id></citation></ref>
<ref id="B13"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Frank</surname> <given-names>E.</given-names></name> <name><surname>Hall</surname> <given-names>M.</given-names></name> <name><surname>Trigg</surname> <given-names>L.</given-names></name> <name><surname>Holmes</surname> <given-names>G.</given-names></name> <name><surname>Witten</surname> <given-names>I. H.</given-names></name></person-group> (<year>2004</year>). <article-title>Data mining in bioinformatics using Weka.</article-title> <source><italic>Bioinformatics</italic></source> <volume>20</volume> <fpage>2479</fpage>&#x2013;<lpage>2481</lpage>.</citation></ref>
<ref id="B14"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Fuentealba</surname> <given-names>P.</given-names></name> <name><surname>Klausberger</surname> <given-names>T.</given-names></name> <name><surname>Karayannis</surname> <given-names>T.</given-names></name> <name><surname>Suen</surname> <given-names>W. Y.</given-names></name> <name><surname>Huck</surname> <given-names>J.</given-names></name> <name><surname>Tomioka</surname> <given-names>R.</given-names></name><etal/></person-group> (<year>2010</year>). <article-title>Expression of COUP-TFII nuclear receptor in restricted GABAergic neuronal populations in the adult rat hippocampus.</article-title> <source><italic>J. Neurosci.</italic></source> <volume>30</volume>:<issue>1595</issue>. <pub-id pub-id-type="doi">10.1523/JNEUROSCI.4199-09.2010</pub-id> <pub-id pub-id-type="pmid">20130170</pub-id></citation></ref>
<ref id="B15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gelman</surname> <given-names>D. M.</given-names></name> <name><surname>Mar&#x00ED;n</surname> <given-names>O.</given-names></name></person-group> (<year>2010</year>). <article-title>Generation of interneuron diversity in the mouse cerebral cortex.</article-title> <source><italic>Eur. J. Neurosci.</italic></source> <volume>31</volume> <fpage>2136</fpage>&#x2013;<lpage>2141</lpage>.</citation></ref>
<ref id="B16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gorodkin</surname> <given-names>J.</given-names></name></person-group> (<year>2004</year>). <article-title>Comparing two K-category assignments by a K-category correlation coefficient.</article-title> <source><italic>Comput. Biol. Chem.</italic></source> <volume>28</volume> <fpage>367</fpage>&#x2013;<lpage>374</lpage>. <pub-id pub-id-type="doi">10.1016/j.compbiolchem.2004.09.006</pub-id> <pub-id pub-id-type="pmid">15556477</pub-id></citation></ref>
<ref id="B17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Henning</surname> <given-names>A. N.</given-names></name> <name><surname>Haag</surname> <given-names>J. D.</given-names></name> <name><surname>Smits</surname> <given-names>B. M. G.</given-names></name> <name><surname>Gould</surname> <given-names>M. N.</given-names></name></person-group> (<year>2016</year>). <article-title>The Non-coding Mammary Carcinoma Susceptibility Locus, Mcs5c, Regulates Pappa Expression via Age-Specific Chromatin Folding and Allele-Dependent DNA Methylation.</article-title> <source><italic>PLoS Gen.</italic></source> <volume>12</volume>:<issue>e1006261</issue>. <pub-id pub-id-type="doi">10.1371/journal.pgen.1006261</pub-id> <pub-id pub-id-type="pmid">27537370</pub-id></citation></ref>
<ref id="B18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hu</surname> <given-names>J. S.</given-names></name> <name><surname>Vogt</surname> <given-names>D.</given-names></name> <name><surname>Lindtner</surname> <given-names>S.</given-names></name> <name><surname>Sandberg</surname> <given-names>M.</given-names></name> <name><surname>Silberberg</surname> <given-names>S. N.</given-names></name> <name><surname>Jlr</surname> <given-names>R.</given-names></name></person-group> (<year>2017</year>). <article-title>Coup-TF1&#x0026;2 (Nr2f1 and Nr2f2) control subtype and laminar identity of MGE-derived neocortical interneurons.</article-title> <source><italic>Development</italic></source> <volume>144</volume>:<issue>2837</issue>.</citation></ref>
<ref id="B19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jia</surname> <given-names>Y.</given-names></name> <name><surname>Zhao</surname> <given-names>R.</given-names></name> <name><surname>Chen</surname> <given-names>L.</given-names></name></person-group> (<year>2020</year>). <article-title>Similarity-Based Machine Learning Model for Predicting the Metabolic Pathways of Compounds.</article-title> <source><italic>IEEE Access</italic></source> <volume>8</volume> <fpage>130687</fpage>&#x2013;<lpage>130696</lpage>.</citation></ref>
<ref id="B20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kelsom</surname> <given-names>C.</given-names></name> <name><surname>Lu</surname> <given-names>W.</given-names></name></person-group> (<year>2013</year>). <article-title>Development and specification of GABAergic cortical interneurons.</article-title> <source><italic>Cell Biosci.</italic></source> <volume>3</volume>:<issue>19</issue>.</citation></ref>
<ref id="B21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Khodosevich</surname> <given-names>K.</given-names></name> <name><surname>Seeburg</surname> <given-names>P. H.</given-names></name> <name><surname>Monyer</surname> <given-names>H.</given-names></name></person-group> (<year>2009</year>). <article-title>Major Signaling Pathways in Migrating Neuroblasts.</article-title> <source><italic>Front. Mol. Neurosci.</italic></source> <volume>2</volume>:<issue>7</issue>. <pub-id pub-id-type="doi">10.3389/neuro.02.007.2009</pub-id> <pub-id pub-id-type="pmid">19668709</pub-id></citation></ref>
<ref id="B22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kim</surname> <given-names>J. B.</given-names></name> <name><surname>Sig</surname> <given-names>C. J.</given-names></name> <name><surname>Yu</surname> <given-names>Y. M.</given-names></name> <name><surname>Nam</surname> <given-names>K.</given-names></name> <name><surname>Piao</surname> <given-names>C. S.</given-names></name> <name><surname>Kim</surname> <given-names>S. W.</given-names></name><etal/></person-group> (<year>2006</year>). <article-title>HMGB1, a novel cytokine-like mediator linking acute neuronal death and delayed neuroinflammation in the postischemic brain.</article-title> <source><italic>J. Neurosci.</italic></source> <volume>26</volume>:<issue>6413</issue>. <pub-id pub-id-type="doi">10.1523/JNEUROSCI.3815-05.2006</pub-id> <pub-id pub-id-type="pmid">16775128</pub-id></citation></ref>
<ref id="B23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kim</surname> <given-names>S. W.</given-names></name> <name><surname>Lim</surname> <given-names>C. M.</given-names></name> <name><surname>Kim</surname> <given-names>J. B.</given-names></name> <name><surname>Shin</surname> <given-names>J. H.</given-names></name> <name><surname>Lee</surname> <given-names>S.</given-names></name> <name><surname>Lee</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2011</year>). <article-title>Extracellular HMGB1 released by NMDA treatment confers neuronal apoptosis via RAGE-p38 MAPK/ERK signaling pathway.</article-title> <source><italic>Neurotox. Res.</italic></source> <volume>20</volume> <fpage>159</fpage>&#x2013;<lpage>169</lpage>. <pub-id pub-id-type="doi">10.1007/s12640-010-9231-x</pub-id> <pub-id pub-id-type="pmid">21116767</pub-id></citation></ref>
<ref id="B24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kobayashi</surname> <given-names>H.</given-names></name> <name><surname>Saragai</surname> <given-names>S.</given-names></name> <name><surname>Naito</surname> <given-names>A.</given-names></name> <name><surname>Ichio</surname> <given-names>K.</given-names></name> <name><surname>Kawauchi</surname> <given-names>D.</given-names></name> <name><surname>Murakami</surname> <given-names>F.</given-names></name></person-group> (<year>2014</year>). <article-title>Calm1 signaling pathway is essential for the migration of mouse precerebellar neurons.</article-title> <source><italic>Development</italic></source> <volume>142</volume> <fpage>375</fpage>&#x2013;<lpage>384</lpage>. <pub-id pub-id-type="doi">10.1242/dev.112680</pub-id> <pub-id pub-id-type="pmid">25519244</pub-id></citation></ref>
<ref id="B25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kohavi</surname> <given-names>R.</given-names></name></person-group> (<year>1995</year>). &#x201C;<article-title>A study of cross-validation and bootstrap for accuracy estimation and model selection</article-title>,&#x201D; in <source><italic>International Joint Conference on Artificial Intelligence.</italic></source> (<publisher-loc>Mahwah</publisher-loc>: <publisher-name>Lawrence Erlbaum Associates Ltd</publisher-name>), <fpage>1137</fpage>&#x2013;<lpage>1145</lpage>.</citation></ref>
<ref id="B26"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Korshunova</surname> <given-names>I.</given-names></name> <name><surname>Caroni</surname> <given-names>P.</given-names></name> <name><surname>Kolkova</surname> <given-names>K.</given-names></name> <name><surname>Berezin</surname> <given-names>V.</given-names></name> <name><surname>Bock</surname> <given-names>E.</given-names></name> <name><surname>Walmod</surname> <given-names>P. S.</given-names></name></person-group> (<year>2010</year>). <article-title>Characterization of BASP1-mediated neurite outgrowth.</article-title> <source><italic>J. Neurosci. Res.</italic></source> <volume>86</volume> <fpage>2201</fpage>&#x2013;<lpage>2213</lpage>. <pub-id pub-id-type="doi">10.1002/jnr.21678</pub-id> <pub-id pub-id-type="pmid">18438920</pub-id></citation></ref>
<ref id="B27"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>J.</given-names></name> <name><surname>Lu</surname> <given-names>L.</given-names></name> <name><surname>Zhang</surname> <given-names>Y.-H.</given-names></name> <name><surname>Xu</surname> <given-names>Y.</given-names></name> <name><surname>Liu</surname> <given-names>M.</given-names></name> <name><surname>Feng</surname> <given-names>K.</given-names></name><etal/></person-group> (<year>2020</year>). <article-title>Identification of leukemia stem cell expression signatures through Monte Carlo feature selection strategy and support vector machine.</article-title> <source><italic>Cancer Gene Ther.</italic></source> <volume>27</volume> <fpage>56</fpage>&#x2013;<lpage>69</lpage>. <pub-id pub-id-type="doi">10.1038/s41417-019-0105-y</pub-id> <pub-id pub-id-type="pmid">31138902</pub-id></citation></ref>
<ref id="B28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liang</surname> <given-names>H.</given-names></name> <name><surname>Chen</surname> <given-names>L.</given-names></name> <name><surname>Zhao</surname> <given-names>X.</given-names></name> <name><surname>Zhang</surname> <given-names>X.</given-names></name></person-group> (<year>2020</year>). <article-title>Prediction of drug side effects with a refined negative sample selection strategy.</article-title> <source><italic>Comput. Math. Methods Med.</italic></source> <volume>2020</volume>:<issue>1573543</issue>. <pub-id pub-id-type="doi">10.1155/2020/1573543</pub-id> <pub-id pub-id-type="pmid">32454877</pub-id></citation></ref>
<ref id="B29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liu</surname> <given-names>H. A.</given-names></name> <name><surname>Setiono</surname> <given-names>R.</given-names></name></person-group> (<year>1998</year>). <article-title>Incremental feature selection.</article-title> <source><italic>Appl. Intell.</italic></source> <volume>9</volume> <fpage>217</fpage>&#x2013;<lpage>230</lpage>.</citation></ref>
<ref id="B30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Machon</surname> <given-names>O.</given-names></name> <name><surname>Masek</surname> <given-names>J.</given-names></name> <name><surname>Machonova</surname> <given-names>O.</given-names></name> <name><surname>Krauss</surname> <given-names>S.</given-names></name> <name><surname>Kozmik</surname> <given-names>Z.</given-names></name></person-group> (<year>2015</year>). <article-title>Meis2 is essential for cranial and cardiac neural crest development.</article-title> <source><italic>BMC Dev. Biol.</italic></source> <volume>15</volume>:<issue>40</issue>. <pub-id pub-id-type="doi">10.1186/s12861-015-0093-6</pub-id></citation></ref>
<ref id="B31"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Magno</surname> <given-names>L.</given-names></name> <name><surname>Barry</surname> <given-names>C.</given-names></name> <name><surname>Schmidthieber</surname> <given-names>C.</given-names></name> <name><surname>Theodotou</surname> <given-names>P.</given-names></name> <name><surname>H&#x00E4;usser</surname> <given-names>M.</given-names></name> <name><surname>Kessaris</surname> <given-names>N.</given-names></name></person-group> (<year>2017</year>). <article-title>NKX2-1 Is Required in the Embryonic Septum for Cholinergic System Development, Learning, and Memory.</article-title> <source><italic>Cell Rep.</italic></source> <volume>20</volume>:<issue>1572</issue>. <pub-id pub-id-type="doi">10.1016/j.celrep.2017.07.053</pub-id> <pub-id pub-id-type="pmid">28813670</pub-id></citation></ref>
<ref id="B32"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Matthews</surname> <given-names>B. W.</given-names></name></person-group> (<year>1975</year>). <article-title>Comparison of the predicted and observed secondary structure of T4 phage lysozyme.</article-title> <source><italic>Biochim. Biophys. Acta</italic></source> <volume>405</volume> <fpage>442</fpage>&#x2013;<lpage>451</lpage>. <pub-id pub-id-type="doi">10.1016/0005-2795(75)90109-9</pub-id> <pub-id pub-id-type="pmid">1180967</pub-id></citation></ref>
<ref id="B33"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mayer</surname> <given-names>C.</given-names></name> <name><surname>Hafemeister</surname> <given-names>C.</given-names></name> <name><surname>Bandler</surname> <given-names>R. C.</given-names></name> <name><surname>Machold</surname> <given-names>R.</given-names></name> <name><surname>Batista Brito</surname> <given-names>R.</given-names></name> <name><surname>Jaglin</surname> <given-names>X.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>Developmental diversification of cortical inhibitory interneurons.</article-title> <source><italic>Nature</italic></source> <volume>555</volume> <fpage>457</fpage>&#x2013;<lpage>462</lpage>.</citation></ref>
<ref id="B34"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mi</surname> <given-names>D.</given-names></name> <name><surname>Li</surname> <given-names>Z.</given-names></name> <name><surname>Lim</surname> <given-names>L.</given-names></name> <name><surname>Li</surname> <given-names>M.</given-names></name> <name><surname>Moissidis</surname> <given-names>M.</given-names></name> <name><surname>Yang</surname> <given-names>Y.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>Early emergence of cortical interneuron diversity in the mouse embryo.</article-title> <source><italic>Science</italic></source> <volume>360</volume> <fpage>81</fpage>&#x2013;<lpage>85</lpage>.</citation></ref>
<ref id="B35"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Milet</surname> <given-names>C.</given-names></name> <name><surname>Maczkowiak</surname> <given-names>F.</given-names></name> <name><surname>Roche</surname> <given-names>D. D.</given-names></name> <name><surname>Monsoro-Burq</surname> <given-names>A. H.</given-names></name></person-group> (<year>2013</year>). <article-title>Pax3 and Zic1 drive induction and differentiation of multipotent, migratory, and functional neural crest in Xenopus embryos.</article-title> <source><italic>Proc. Natl. Acad. Sci. U.S.A.</italic></source> <volume>110</volume> <fpage>5528</fpage>&#x2013;<lpage>5533</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1219124110</pub-id> <pub-id pub-id-type="pmid">23509273</pub-id></citation></ref>
<ref id="B36"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ostroumova</surname> <given-names>O. S.</given-names></name> <name><surname>Schagina</surname> <given-names>L. V.</given-names></name> <name><surname>Mosevitsky</surname> <given-names>M. I.</given-names></name> <name><surname>Zakharov</surname> <given-names>V. V.</given-names></name></person-group> (<year>2011</year>). <article-title>Ion channel activity of brain abundant protein BASP1 in planar lipid bilayers.</article-title> <source><italic>Febs J.</italic></source> <volume>278</volume> <fpage>461</fpage>&#x2013;<lpage>469</lpage>. <pub-id pub-id-type="doi">10.1111/j.1742-4658.2010.07967.x</pub-id> <pub-id pub-id-type="pmid">21156029</pub-id></citation></ref>
<ref id="B37"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pan</surname> <given-names>X.</given-names></name> <name><surname>Li</surname> <given-names>H.</given-names></name> <name><surname>Zeng</surname> <given-names>T.</given-names></name> <name><surname>Li</surname> <given-names>Z.</given-names></name> <name><surname>Chen</surname> <given-names>L.</given-names></name> <name><surname>Huang</surname> <given-names>T.</given-names></name><etal/></person-group> (<year>2021</year>). <article-title>Identification of protein subcellular localization with network and functional embeddings.</article-title> <source><italic>Front. Gen</italic></source> <volume>11</volume>:<issue>626500</issue>. <pub-id pub-id-type="doi">10.3389/fgene.2020.626500</pub-id> <pub-id pub-id-type="pmid">33584818</pub-id></citation></ref>
<ref id="B38"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pan</surname> <given-names>X. Y.</given-names></name> <name><surname>Zhang</surname> <given-names>Y. N.</given-names></name> <name><surname>Shen</surname> <given-names>H. B.</given-names></name></person-group> (<year>2010</year>). <article-title>Large-scale prediction of human protein-protein interactions from amino acid sequence based on latent topic features.</article-title> <source><italic>J. Proteome Res.</italic></source> <volume>9</volume> <fpage>4992</fpage>&#x2013;<lpage>5001</lpage>. <pub-id pub-id-type="doi">10.1021/pr100618t</pub-id> <pub-id pub-id-type="pmid">20698572</pub-id></citation></ref>
<ref id="B39"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Peng</surname> <given-names>H. C.</given-names></name> <name><surname>Long</surname> <given-names>F. H.</given-names></name> <name><surname>Ding</surname> <given-names>C.</given-names></name></person-group> (<year>2005</year>). <article-title>Feature selection based on mutual information: Criteria of max-dependency, max-relevance, and min-redundancy.</article-title> <source><italic>IEEE Trans. Pattern Anal. Mach. Intell.</italic></source> <volume>27</volume> <fpage>1226</fpage>&#x2013;<lpage>1238</lpage>. <pub-id pub-id-type="doi">10.1109/TPAMI.2005.159</pub-id> <pub-id pub-id-type="pmid">16119262</pub-id></citation></ref>
<ref id="B40"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pfeffer</surname> <given-names>C. K.</given-names></name> <name><surname>Xue</surname> <given-names>M.</given-names></name> <name><surname>He</surname> <given-names>M.</given-names></name> <name><surname>Huang</surname> <given-names>Z. J.</given-names></name> <name><surname>Scanziani</surname> <given-names>M.</given-names></name></person-group> (<year>2013</year>). <article-title>Inhibition of inhibition in visual cortex: the logic of connections between molecularly distinct interneurons.</article-title> <source><italic>Nat. Neurosci.</italic></source> <volume>16</volume> <fpage>1068</fpage>&#x2013;<lpage>1076</lpage>. <pub-id pub-id-type="doi">10.1038/nn.3446</pub-id> <pub-id pub-id-type="pmid">23817549</pub-id></citation></ref>
<ref id="B41"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pi</surname> <given-names>H. J.</given-names></name> <name><surname>Hangya</surname> <given-names>B.</given-names></name> <name><surname>Kvitsiani</surname> <given-names>D.</given-names></name> <name><surname>Sanders</surname> <given-names>J. I.</given-names></name> <name><surname>Huang</surname> <given-names>Z. J.</given-names></name> <name><surname>Kepecs</surname> <given-names>A.</given-names></name></person-group> (<year>2013</year>). <article-title>Cortical interneurons that specialize in disinhibitory control.</article-title> <source><italic>Nature</italic></source> <volume>503</volume> <fpage>521</fpage>&#x2013;<lpage>524</lpage>.</citation></ref>
<ref id="B42"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ping</surname> <given-names>F.</given-names></name> <name><surname>Schachner</surname> <given-names>M.</given-names></name> <name><surname>Shen</surname> <given-names>Y. Q.</given-names></name></person-group> (<year>2012</year>). <article-title>HMGB1 in Development and Diseases of the Central Nervous System.</article-title> <source><italic>Mol. Neurobiol.</italic></source> <volume>45</volume> <fpage>499</fpage>&#x2013;<lpage>506</lpage>.</citation></ref>
<ref id="B43"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rodenas-Cuadrado</surname> <given-names>P. M.</given-names></name> <name><surname>Mengede</surname> <given-names>J.</given-names></name> <name><surname>Baas</surname> <given-names>L.</given-names></name> <name><surname>Devanna</surname> <given-names>P.</given-names></name> <name><surname>Schmid</surname> <given-names>T. A.</given-names></name> <name><surname>Yartsev</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>Mapping the distribution of language related genes FoxP1, FoxP2, and CntnaP2 in the brains of vocal learning bat species.</article-title> <source><italic>J. Comp. Neurol.</italic></source> <volume>526</volume> <fpage>1235</fpage>&#x2013;<lpage>1266</lpage>. <pub-id pub-id-type="doi">10.1002/cne.24385</pub-id> <pub-id pub-id-type="pmid">29297931</pub-id></citation></ref>
<ref id="B44"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Taylor</surname> <given-names>A. M.</given-names></name> <name><surname>Humphries</surname> <given-names>J. M.</given-names></name> <name><surname>White</surname> <given-names>R. M.</given-names></name> <name><surname>Murphey</surname> <given-names>R. D.</given-names></name> <name><surname>Burns</surname> <given-names>C. E.</given-names></name> <name><surname>Zon</surname> <given-names>L. I.</given-names></name></person-group> (<year>2012</year>). <article-title>Hematopoietic defects in rps29 mutant zebrafish depend upon p53 activation.</article-title> <source><italic>Exp. Hematol.</italic></source> <volume>40</volume>:<issue>228</issue>. <pub-id pub-id-type="doi">10.1016/j.exphem.2011.11.007</pub-id> <pub-id pub-id-type="pmid">22120640</pub-id></citation></ref>
<ref id="B45"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tomioka</surname> <given-names>T.</given-names></name> <name><surname>Shimazaki</surname> <given-names>T.</given-names></name> <name><surname>Yamauchi</surname> <given-names>T.</given-names></name> <name><surname>Oki</surname> <given-names>T.</given-names></name> <name><surname>Ohgoh</surname> <given-names>M.</given-names></name> <name><surname>Okano</surname> <given-names>H.</given-names></name></person-group> (<year>2014</year>). <article-title>LIM Homeobox 8 (Lhx8) Is a Key Regulator of the Cholinergic Neuronal Function via a Tropomyosin Receptor Kinase A (TrkA)-mediated Positive Feedback Loop.</article-title> <source><italic>J. Biol. Chem.</italic></source> <volume>289</volume> <fpage>1000</fpage>&#x2013;<lpage>1010</lpage>. <pub-id pub-id-type="doi">10.1074/jbc.M113.494385</pub-id> <pub-id pub-id-type="pmid">24265310</pub-id></citation></ref>
<ref id="B46"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>X. J.</given-names></name></person-group> (<year>2002</year>). <article-title>Probabilistic decision making by slow reverberation in cortical circuits.</article-title> <source><italic>Neuron</italic></source> <volume>36</volume> <fpage>955</fpage>&#x2013;<lpage>968</lpage>. <pub-id pub-id-type="doi">10.1016/s0896-6273(02)01092-9</pub-id> <pub-id pub-id-type="pmid">12467598</pub-id></citation></ref>
<ref id="B47"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wonders</surname> <given-names>C. P.</given-names></name> <name><surname>Anderson</surname> <given-names>S. A.</given-names></name></person-group> (<year>2006</year>). <article-title>The origin and specification of cortical interneurons.</article-title> <source><italic>Nat. Rev. Neurosci.</italic></source> <volume>7</volume> <fpage>687</fpage>&#x2013;<lpage>696</lpage>.</citation></ref>
<ref id="B48"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>Y. H.</given-names></name> <name><surname>Li</surname> <given-names>H.</given-names></name> <name><surname>Zeng</surname> <given-names>T.</given-names></name> <name><surname>Chen</surname> <given-names>L.</given-names></name> <name><surname>Li</surname> <given-names>Z.</given-names></name> <name><surname>Huang</surname> <given-names>T.</given-names></name><etal/></person-group> (<year>2021c</year>). <article-title>Identifying Transcriptomic Signatures and Rules for SARS-CoV-2 Infection.</article-title> <source><italic>Front. Cell. Dev. Biol.</italic></source> <volume>8</volume>:<issue>627302</issue>. <pub-id pub-id-type="doi">10.3389/fcell.2020.627302</pub-id> <pub-id pub-id-type="pmid">33505977</pub-id></citation></ref>
<ref id="B49"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>Y.-H.</given-names></name> <name><surname>Li</surname> <given-names>Z.</given-names></name> <name><surname>Zeng</surname> <given-names>T.</given-names></name> <name><surname>Chen</surname> <given-names>L.</given-names></name> <name><surname>Li</surname> <given-names>H.</given-names></name> <name><surname>Huang</surname> <given-names>T.</given-names></name><etal/></person-group> (<year>2021a</year>). <article-title>Detecting the multiomics signatures of factor-specific inflammatory effects on airway smooth muscles.</article-title> <source><italic>Front. Gen.</italic></source> <volume>11</volume>:<issue>599970</issue>. <pub-id pub-id-type="doi">10.3389/fgene.2020.599970</pub-id> <pub-id pub-id-type="pmid">33519902</pub-id></citation></ref>
<ref id="B50"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>Y.-H.</given-names></name> <name><surname>Zeng</surname> <given-names>T.</given-names></name> <name><surname>Chen</surname> <given-names>L.</given-names></name> <name><surname>Huang</surname> <given-names>T.</given-names></name> <name><surname>Cai</surname> <given-names>Y.-D.</given-names></name></person-group> (<year>2021b</year>). <article-title>Determining protein&#x2013;protein functional associations by functional rules based on gene ontology and KEGG pathway.</article-title> <source><italic>Biochim. Biophy. Acta Proteins Proteom.</italic></source> <volume>1869</volume>:<issue>140621</issue>.</citation></ref>
<ref id="B51"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>Y.-H.</given-names></name> <name><surname>Li</surname> <given-names>Z.</given-names></name> <name><surname>Zeng</surname> <given-names>T.</given-names></name> <name><surname>Pan</surname> <given-names>X.</given-names></name> <name><surname>Chen</surname> <given-names>L.</given-names></name> <name><surname>Liu</surname> <given-names>D.</given-names></name><etal/></person-group> (<year>2020</year>). <article-title>Distinguishing glioblastoma subtypes by methylation signatures.</article-title> <source><italic>Front. Gen.</italic></source> <volume>11</volume>:<issue>604336</issue>. <pub-id pub-id-type="doi">10.3389/fgene.2020.604336</pub-id> <pub-id pub-id-type="pmid">33329750</pub-id></citation></ref>
<ref id="B52"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhao</surname> <given-names>X.</given-names></name> <name><surname>Chen</surname> <given-names>L.</given-names></name> <name><surname>Lu</surname> <given-names>J.</given-names></name></person-group> (<year>2018</year>). <article-title>A similarity-based method for prediction of drug side effects with heterogeneous information.</article-title> <source><italic>Math.Biosci.</italic></source> <volume>306</volume> <fpage>136</fpage>&#x2013;<lpage>144</lpage>. <pub-id pub-id-type="doi">10.1016/j.mbs.2018.09.010</pub-id> <pub-id pub-id-type="pmid">30296417</pub-id></citation></ref>
<ref id="B53"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhao</surname> <given-names>Y.</given-names></name> <name><surname>Mar&#x00ED;n</surname> <given-names>O.</given-names></name> <name><surname>Hermesz</surname> <given-names>E.</given-names></name> <name><surname>Powell</surname> <given-names>A.</given-names></name> <name><surname>Flames</surname> <given-names>N.</given-names></name> <name><surname>Palkovits</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2003</year>). <article-title>The LIM-homeobox gene Lhx8 is required for the development of many cholinergic neurons in the mouse forebrain.</article-title> <source><italic>Proc. Natl. Acad. Sci. U.S.A.</italic></source> <volume>100</volume> <fpage>9005</fpage>&#x2013;<lpage>9010</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1537759100</pub-id> <pub-id pub-id-type="pmid">12855770</pub-id></citation></ref>
<ref id="B54"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhou</surname> <given-names>J.-P.</given-names></name> <name><surname>Chen</surname> <given-names>L.</given-names></name> <name><surname>Guo</surname> <given-names>Z.-H.</given-names></name></person-group> (<year>2020</year>). <article-title>iATC-NRAKEL: an efficient multi-label classifier for recognizing anatomical therapeutic chemical classes of drugs.</article-title> <source><italic>Bioinformatics</italic></source> <volume>36</volume> <fpage>1391</fpage>&#x2013;<lpage>1396</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btz757</pub-id> <pub-id pub-id-type="pmid">31593226</pub-id></citation></ref>
<ref id="B55"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhu</surname> <given-names>Y.</given-names></name> <name><surname>Hu</surname> <given-names>B.</given-names></name> <name><surname>Chen</surname> <given-names>L.</given-names></name> <name><surname>Dai</surname> <given-names>Q.</given-names></name></person-group> (<year>2021</year>). <article-title>iMPTCE-Hnetwork: a multi-label classifier for identifying metabolic pathway types of chemicals and enzymes with a heterogeneous network.</article-title> <source><italic>Comput. Math. Methods Med.</italic></source> <volume>2021</volume>:<issue>6683051</issue>. <pub-id pub-id-type="doi">10.1155/2021/6683051</pub-id> <pub-id pub-id-type="pmid">33488764</pub-id></citation></ref>
</ref-list>
</back>
</article>