<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Earth Sci.</journal-id>
<journal-title>Frontiers in Earth Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Earth Sci.</abbrev-journal-title>
<issn pub-type="epub">2296-6463</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">713803</article-id>
<article-id pub-id-type="doi">10.3389/feart.2021.713803</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Earth Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Improving Geospatial Agreement by Hybrid Optimization in Logistic Regression-Based Landslide Susceptibility Modelling</article-title>
<alt-title alt-title-type="left-running-head">Sun et&#x20;al.</alt-title>
<alt-title alt-title-type="right-running-head">Geospatial Agreement by Optimized LR-LSM</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Sun</surname>
<given-names>Deliang</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Wen</surname>
<given-names>Haijia</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1023428/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Xu</surname>
<given-names>Jiahui</given-names>
</name>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhang</surname>
<given-names>Yalan</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wang</surname>
<given-names>Danzhou</given-names>
</name>
<xref ref-type="aff" rid="aff6">
<sup>6</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zhang</surname>
<given-names>Jialan</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
</contrib>
</contrib-group>
<aff id="aff1">
<label>
<sup>1</sup>
</label>Key Laboratory of GIS Application Research, Chongqing Normal University, <addr-line>Chongqing</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<label>
<sup>2</sup>
</label>Key Laboratory of New Technology for Construction of Cities in Mountain Area, Ministry of Education, Chongqing University, <addr-line>Chongqing</addr-line>, <country>China</country>
</aff>
<aff id="aff3">
<label>
<sup>3</sup>
</label>National Joint Engineering Research Center of Geohazards Prevention in the Reservoir Areas, Chongqing University, <addr-line>Chongqing</addr-line>, <country>China</country>
</aff>
<aff id="aff4">
<label>
<sup>4</sup>
</label>School of Civil Engineering, Chongqing University, <addr-line>Chongqing</addr-line>, <country>China</country>
</aff>
<aff id="aff5">
<label>
<sup>5</sup>
</label>Key Laboratory of Geographic Information Science (Ministry of Education), East China Normal University, <addr-line>Shanghai</addr-line>, <country>China</country>
</aff>
<aff id="aff6">
<label>
<sup>6</sup>
</label>Key Laboratory of Environmental Change and Natural Disaster, Ministry of Education, Beijing Normal University, <addr-line>Beijing</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1259287/overview">Faming Huang</ext-link>, Nanchang University, China</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1370434/overview">Lihan Pan</ext-link>, Nanchang University, China</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1371587/overview">Sudesh Pundir</ext-link>, Pondicherry University, India</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Haijia Wen, <email>jhw@cqu.edu.cn</email>
</corresp>
<fn fn-type="other">
<p>This article was submitted to Geohazards and Georisks, a section of the journal Frontiers in Earth Science</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>25</day>
<month>08</month>
<year>2021</year>
</pub-date>
<pub-date pub-type="collection">
<year>2021</year>
</pub-date>
<volume>9</volume>
<elocation-id>713803</elocation-id>
<history>
<date date-type="received">
<day>24</day>
<month>05</month>
<year>2021</year>
</date>
<date date-type="accepted">
<day>28</day>
<month>07</month>
<year>2021</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2021 Sun, Wen, Xu, Zhang, Wang and Zhang.</copyright-statement>
<copyright-year>2021</copyright-year>
<copyright-holder>Sun, Wen, Xu, Zhang, Wang and Zhang</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these&#x20;terms.</p>
</license>
</permissions>
<abstract>
<p>This study aims to develop a logistic regression model of landslide susceptibility based on GeoDetector for dominant-factor screening and 10-fold cross validation for training sample optimization. First, Fengjie County, a typical mountainous area, was selected as the study area since it experienced 1,522 landslides from 2001 to 2016. Second, 22 factors were selected as the initial conditioning factors, and a geospatial database was established with a grid of 30&#xa0;m precision. Factor detection of the geographic detector and the stepwise regression method included in logistic regression were used to screen out the dominant factors from the database. Then, based on the sample dataset with a 1:10 ratio of landslides and nonlandslides, 10-fold cross validation was used to select the optimized sample to train the logistic regression model of landslide susceptibility in the study area. Finally, the accuracy and efficiency of the two models before and after screening out the dominant factors were evaluated and compared. The results showed that the total accuracy of both models was more than 0.9, and the area under the curve value of the receiver operating characteristic curve was more than 0.8, indicating that the models before and after factor screening both had high reliability and good prediction ability. Besides, the screened factors had an active leading role in the geospatial distribution of the historical landslide, indicating that the screened dominant factors have individual rationality. By improving the geospatial agreement between landslide susceptibility and actual landslide-prone areas through the screening of dominant factors and the optimization of the training samples, a simple, efficient, and reliable logistic-regression&#x2013;based landslide susceptibility model can be constructed.</p>
</abstract>
<kwd-group>
<kwd>landslide susceptibility</kwd>
<kwd>GeoDetector</kwd>
<kwd>dominant-factor screening</kwd>
<kwd>logistic regression</kwd>
<kwd>10-fold cross validation</kwd>
</kwd-group>
<contract-sponsor id="cn001">National Key Research and Development Program of China<named-content content-type="fundref-id">10.13039/501100012166</named-content>
</contract-sponsor>
<contract-sponsor id="cn002">Fundamental Research Funds for the Central Universities<named-content content-type="fundref-id">10.13039/501100012226</named-content>
</contract-sponsor>
</article-meta>
</front>
<body>
<sec id="s1">
<title>Highlights</title>
<p>
<list list-type="simple">
<list-item>
<p>&#x2022;A hybrid optimal LR model by GeoDetector dominant-factor screening and an optimal sample</p>
</list-item>
<list-item>
<p>&#x2022;Improved accuracy of the LR-based LSM model by hybrid optimization</p>
</list-item>
<list-item>
<p>&#x2022;Optimized LSM agreed well with the geospatial distribution of historical and new landslide events</p>
</list-item>
</list>
</p>
</sec>
<sec id="s2">
<title>Introduction</title>
<p>Among many types of geological disasters, such as land subsidence and mudslides, landslides are the most common ones (<xref ref-type="bibr" rid="B51">Abedi Gheshlaghi and Feizizadeh, 2021</xref>). Because they are frequent, destructive, and widespread, every country attaches great importance to the monitoring and prevention of landslides (<xref ref-type="bibr" rid="B27">Naemitabar and Zanganeh Asadi, 2021</xref>). About two-thirds of China&#x2019;s area is a mountainous region, where landslides are most prone to occur (<xref ref-type="bibr" rid="B14">Gautam et&#x20;al., 2021</xref>). From 2007 to 2019, it is conservatively estimated that the number of deaths/missing caused by landslides exceeded 7,900, with an average of more than 600 per year. According to statistics from the China Geological Environment Information Site, the economic loss is about 610 million dollars each&#x20;year.</p>
<p>The evaluation of landslide susceptibility is an important part of the whole process of landslide risk management, which has achieved the effect of preventing and reducing landslide losses (<xref ref-type="bibr" rid="B52">Feizizadeh et&#x20;al., 2014</xref>). With the development of geographic information science (GIS) technology, scholars have actively explored landslide susceptibility mapping (LSM) methods (<xref ref-type="bibr" rid="B21">Li et&#x20;al., 2019</xref>; <xref ref-type="bibr" rid="B49">Zhao et&#x20;al., 2021</xref>). So far, dozens of landslide susceptibility mapping (LSM) methods have been developed, which can be divided into several categories, including statistical methods, expert-based methods, and data mining methods (<xref ref-type="bibr" rid="B20">Kalantar et&#x20;al., 2018</xref>; <xref ref-type="bibr" rid="B24">Ma and Xu, 2019</xref>). <xref ref-type="bibr" rid="B17">Huang et&#x20;al. (2020)</xref>, <xref ref-type="bibr" rid="B44">Wubalem (2021)</xref>, <xref ref-type="bibr" rid="B19">Huangfu et&#x20;al. (2021)</xref>, and <xref ref-type="bibr" rid="B32">Soma et&#x20;al. (2019)</xref> used semisupervised multiple-layer perceptron, information value, a multiple logistic regression algorithm, frequency ratio (FR), and logistic regression (LR) models to produce LSM. Among these different evaluation methods, the most common and reliable one is logistic regression (<xref ref-type="bibr" rid="B3">Ayalew and Yamagishi, 2005</xref>; <xref ref-type="bibr" rid="B20">Kalantar et&#x20;al., 2018</xref>; <xref ref-type="bibr" rid="B30">Shan et&#x20;al., 2020</xref>). Some scholars have discovered that the accuracy of the logistic regression model (LRM) can be improved by changing the parameters or models that optimize LRM. <xref ref-type="bibr" rid="B13">Feby et&#x20;al. (2020)</xref> optimized the logistic regression model by a spatially integrated evidential belief function. The ROC-AUC value of the optimized model is 0.935, which is more satisfactory than the traditional model. 
The results of LSM research are not only affected by the selected model but also closely related to the choice of conditioning factors (<xref ref-type="bibr" rid="B46">Xie et&#x20;al., 2021</xref>). <xref ref-type="bibr" rid="B29">Reichenbach et&#x20;al. (2018)</xref> found that a total of 596 conditioning factors were considered in the existing work, with an average of nine condition factors in each model. In the existing research, the selection of condition factors is mostly determined by expert experience, which is very subjective (<xref ref-type="bibr" rid="B5">Bourenane et&#x20;al., 2015</xref>; <xref ref-type="bibr" rid="B26">Morales et&#x20;al., 2021</xref>; <xref ref-type="bibr" rid="B49">Zhao et&#x20;al., 2021</xref>). The current research lacks a general framework to objectively select the condition factors. Therefore, how to screen out dominant factors more objectively and quickly and then build a more stable and reliable model is the focus of current research.</p>
<p>Among the methods for factor screening in existing research, GeoDetector is a very common one (<xref ref-type="bibr" rid="B50">Zhou et&#x20;al., 2021</xref>). <xref ref-type="bibr" rid="B7">Chi et&#x20;al. (2021)</xref> analyzed the influence of specific geographical factors on the spatial distribution of terrestrial mammalian richness using the GeoDetector model. <xref ref-type="bibr" rid="B41">Wang et&#x20;al. (2021)</xref> used GeoDetector to identify spatial relationships among the influencing factors about soil heavy metal As. <xref ref-type="bibr" rid="B33">Sun et&#x20;al. (2021c)</xref> constructed the LSM model in Fengjie County using fundamental influencing factors screened by GeoDetector and recursive feature elimination. Although the logistic regression model has a large number of applications in the field of LSM, due to the limitation of the model itself, it has limitations in dealing with a large number of conditioning factors with multicollinearity (<xref ref-type="bibr" rid="B35">Sun et&#x20;al., 2021b</xref>). In addition, in the existing research, there is no article about the combined use of GeoDetector and logistic regression.</p>
<p>Based on previous research, this paper aims to propose an optimized landslide susceptibility evaluation model. This study takes Fengjie County as the study area, systematically considers the formation conditions of the landslide, and selects the conditioning factors as comprehensively as possible when conditions permit. Then, through the combination of GeoDetector and the stepwise regression method, the characteristic disaster conditioning factors are screened. Then, the 10-fold cross-validation method is used to select the best training sample. After training, an optimized logistic regression model of landslide susceptibility is obtained, and finally, the optimized model is evaluated through GIS software in the study&#x20;area.</p>
</sec>
<sec sec-type="materials" id="s3">
<title>Materials</title>
<sec id="s3-1">
<title>Study Area</title>
<p>Fengjie County of Chongqing, with typical mountainous landforms, is located in the east of the Sichuan Basin, the upper reaches of the Yangtze River (<xref ref-type="fig" rid="F1">Figure&#x20;1</xref>). It is the junction of the Dabashan arc fold fault zone and east Sichuan arc concave fold zone, with a complex structural stress field. The elevation ranges from 87 to 2,125&#xa0;m, and the terrain is generally higher in the north than in the south. It is located in the subtropical monsoon climate zone, with a multiyear average annual precipitation of 1,132&#xa0;mm.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Location of the study&#x20;area.</p>
</caption>
<graphic xlink:href="feart-09-713803-g001.tif"/>
</fig>
</sec>
<sec id="s3-2">
<title>Data</title>
<p>The data of landslides in Fengjie County were obtained from the Chongqing Geological Environment Monitoring Station. Its attributes contained the landslide name, coordinates, elevation, and time of occurrence. The 1:200,000/1:50,000 geological map of the China Geological Information Library (available online: <ext-link ext-link-type="uri" xlink:href="http://ngac.org.cn/">http://ngac.org.cn/</ext-link>) provides a reference basis for the site investigation of landslides in terms of regional geological environment, geological structure, and stratigraphic lithology. The data of Chongqing points of interest (POI) were obtained using a Python program or script written according to certain rules that can automatically capture World Wide Web information. These activity points stand for various types of commercial and educational activities that can represent human engineering activities, such as hospitals, primary and secondary schools, business centers, parks and squares, and so on. Also, the time range was consistent with the historical landslides. Other primary data information is shown in <xref ref-type="table" rid="T1">Table&#x20;1</xref>.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Data and data sources.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Data name</th>
<th align="center">Data sources</th>
<th align="center">Resolution</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Landslide</td>
<td align="left">Chongqing Geological Environment Monitoring Station</td>
<td align="center">&#x2014;</td>
</tr>
<tr>
<td align="left">Elevation</td>
<td align="left">Aster satellite</td>
<td align="center">30&#xa0;m</td>
</tr>
<tr>
<td align="left">Geological data</td>
<td align="left">China Geological Information Library</td>
<td align="center">1:50 000 &#x223c; 1:200 000</td>
</tr>
<tr>
<td align="left">Land cover</td>
<td align="left">Chongqing Municipal Bureau of Land and Resources</td>
<td align="center">1:100 000</td>
</tr>
<tr>
<td align="left">Administrative division</td>
<td align="left">Chongqing Municipal Bureau of Land and Resources</td>
<td align="center">1:100 000</td>
</tr>
<tr>
<td align="left">River network</td>
<td align="left">Chongqing Water Resources Bureau</td>
<td align="center">1:100 000</td>
</tr>
<tr>
<td align="left">Satellite image</td>
<td align="left">Geospatial Data Cloud platform</td>
<td align="center">30&#xa0;m</td>
</tr>
<tr>
<td align="left">Annual rainfall</td>
<td align="left">Chongqing Meteorological Administration</td>
<td align="center">&#x2014;</td>
</tr>
<tr>
<td align="left">Road</td>
<td align="left">Chongqing Transportation Commission</td>
<td align="center">1:100 000</td>
</tr>
<tr>
<td align="left">POI</td>
<td align="left">Web Crawler</td>
<td align="center">&#x2014;</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
</sec>
<sec sec-type="methods" id="s4">
<title>Methodology</title>
<sec id="s4-1">
<title>Study Flowchart</title>
<p>In this study, Fengjie County, a typical mountainous county in the Three Gorges Reservoir area of China, was chosen as a test site to carry out the research. The methodological flowchart is shown in <xref ref-type="fig" rid="F2">Figure&#x20;2</xref>. Firstly, we selected 22 factors as the initial conditioning factors for LSM, which were derived from a satellite image, a DEM, geological data including lithology and faults, and other multisource data. Secondly, a geospatial database was established based on all data (including landslides and nonlandslides). By including geographic factor detection into a stepwise logistic regression (LR) procedure, screening out the dominant factors was then performed. Then, 10-fold cross validation was used to select the optimized training sample to generate the LSM in the study area. Then, a stable LR model with dominant factors was applied for higher accuracy and stability. Finally, the accuracy of the two models before and after optimization was evaluated and used for&#x20;LSM.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Methodological flowchart used in this&#x20;study.</p>
</caption>
<graphic xlink:href="feart-09-713803-g002.tif"/>
</fig>
</sec>
<sec id="s4-2">
<title>Logistic Regression Model</title>
<p>Logistic regression (LR) is a generalized linear regression analysis method suitable for multivariable control. Different from the general linear regression model, the logistic regression model restricts the output value to the interval [0,1] through the sigmoid function. Therefore, <italic>f(z)</italic>, representing the probability of landslide susceptibility, can be expressed by the following equation:<disp-formula id="e1">
<mml:math id="m1">
<mml:mrow>
<mml:mi>f</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>z</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2b;</mml:mo>
<mml:msup>
<mml:mi>e</mml:mi>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>z</mml:mi>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mfrac>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
<label>(1)</label>
</disp-formula>where <italic>z &#x3d; w<sub>1</sub>x<sub>1</sub> &#x2b; w<sub>2</sub>x<sub>2</sub> &#x2b; &#x2026; &#x2b; w<sub>M</sub>x<sub>M</sub> &#x2b; b</italic> is a weighted linear combination model. <italic>b</italic> is a constant, which is the intercept of the function. <italic>w<sub>M</sub></italic> (M &#x3d; 1,2,3,&#x2026;,22) is the regression coefficient of the function. The independent variable <italic>x<sub>M</sub></italic> (M &#x3d; 1,2,3,&#x2026;,22) represents 22 landslide conditioning factors. When the <italic>f(z)</italic> value is 1, it means that a landslide will surely occur, and when it is 0, it means no landslide will occur (<xref ref-type="bibr" rid="B20">Kalantar et&#x20;al., 2018</xref>).</p>
<p>The LR model includes the stepwise regression method to screen and eliminate the variables, thus eliminating multicollinearity and obtaining significant factors. The stepwise regression consists of three steps. The first step is introducing variables into the model one by one. Second, an F test is performed after introducing each explanatory variable. The final step is to perform a t-test on the explanatory variables already in the model. Once the newly added explanatory variable causes the previous explanatory variable to be no longer significant, it shall be eliminated to ensure that only essential variables are included in the regression equation before introducing each new variable.</p>
</sec>
<sec id="s4-3">
<title>GeoDetector</title>
<p>The GeoDetector is a statistical method proposed by Wang in 2010 (<xref ref-type="bibr" rid="B43">Wang et&#x20;al., 2010</xref>), which is used to detect spatial differentiation, revealing its driving force based on four detectors: differentiation and factor detection, interaction detection, risk-area detection, and ecological detection. This method can work both on numerical and qualitative data. In this study, to improve the geospatial agreement between landslides and their conditioning factors, the factor detection function was used to screen the landslide dominant factors.</p>
<p>The general assumption of landslide factors screening using the GeoDetector can be expressed as follows: if a conditioning factor controls or contributes to a landslide, the geospatial distribution should be similar to a certain extent between the conditioning factor and the landslide. The similarity between the two is determined by the local and global variance (<xref ref-type="bibr" rid="B23">Luo and Liu, 2018</xref>). Let X be a layer of data representing the impact factors (e.g., lithology or slope) of interest and the binary variable Y quantitatively represent the spatial distribution of the landslide. X needs to be either a category layer (for example, lithology) or can be transformed into a category zone (for example, a continuous slope can be divided into three areas: gentle, moderate, and steep). Overlaying the Y and X layers subdivides Y according to the areas of&#x20;X.</p>
<p>If the factor X is related to Y, then Y will exhibit a spatial distribution similar to that of X. In the perfect case, factor X thoroughly explains the pattern of Y, the value of Y is uniform in each region of X, and the spatial variance of Y in all regions is 0. In reality, the degree of spatial correspondence between X and Y is measured by the degree of interpretation of factor X, which is defined as<disp-formula id="e2">
<mml:math id="m2">
<mml:mrow>
<mml:mi>q</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msubsup>
<mml:mstyle displaystyle="true">
<mml:mo>&#x2211;</mml:mo>
</mml:mstyle>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>S</mml:mi>
</mml:msubsup>
<mml:msub>
<mml:mi>N</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
<mml:msubsup>
<mml:mi>&#x3c3;</mml:mi>
<mml:mi>m</mml:mi>
<mml:mn>2</mml:mn>
</mml:msubsup>
</mml:mrow>
<mml:mrow>
<mml:mi>N</mml:mi>
<mml:msup>
<mml:mi>&#x3c3;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:mfrac>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>W</mml:mi>
<mml:mi>S</mml:mi>
<mml:mi>S</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>S</mml:mi>
<mml:mi>S</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
<label>(2)</label>
</disp-formula>
<disp-formula id="e3">
<mml:math id="m3">
<mml:mrow>
<mml:mi mathvariant="normal">WSS</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:munderover>
<mml:mstyle displaystyle="true">
<mml:mo>&#x2211;</mml:mo>
</mml:mstyle>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>S</mml:mi>
</mml:munderover>
<mml:msub>
<mml:mi>N</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
<mml:msubsup>
<mml:mi>&#x3c3;</mml:mi>
<mml:mi>m</mml:mi>
<mml:mn>2</mml:mn>
</mml:msubsup>
<mml:mo>,</mml:mo>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi mathvariant="normal">TSS</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mi>N</mml:mi>
<mml:msup>
<mml:mi>&#x3c3;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
<label>(3)</label>
</disp-formula>
<disp-formula id="e4">
<mml:math id="m4">
<mml:mrow>
<mml:msubsup>
<mml:mi>&#x3c3;</mml:mi>
<mml:mi>m</mml:mi>
<mml:mn>2</mml:mn>
</mml:msubsup>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msubsup>
<mml:mstyle displaystyle="true">
<mml:mo>&#x2211;</mml:mo>
</mml:mstyle>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:msub>
<mml:mi>N</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
</mml:msubsup>
<mml:msup>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>Y</mml:mi>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:msub>
<mml:mi>Y</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="true">&#xaf;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mi>N</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:mfrac>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
<label>(4)</label>
</disp-formula>
<disp-formula id="e5">
<mml:math id="m5">
<mml:mrow>
<mml:msup>
<mml:mi>&#x3c3;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msubsup>
<mml:mstyle displaystyle="true">
<mml:mo>&#x2211;</mml:mo>
</mml:mstyle>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>N</mml:mi>
</mml:msubsup>
<mml:msup>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>Y</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mrow>
<mml:mover accent="true">
<mml:mi>Y</mml:mi>
<mml:mo>&#xaf;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
<mml:mrow>
<mml:mi>N</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:mfrac>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
<label>(5)</label>
</disp-formula>where m &#x3d; 1,&#x2026;, S is the layering of variable Y or factor X, that is, classification or partition; N<sub>m</sub> and N are the numbers of units in layer m and in the whole area, respectively; and <inline-formula id="inf1">
<mml:math id="m10">
<mml:mrow>
<mml:msubsup>
<mml:mi>&#x3c3;</mml:mi>
<mml:mi>m</mml:mi>
<mml:mn>2</mml:mn>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf2">
<mml:math id="m11">
<mml:mrow>
<mml:msup>
<mml:mi>&#x3c3;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo>&#xa0;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>are the variances of the Y value in layer m and in the entire region, respectively. The Within Sum of Squares (WSS) is the sum of the within-layer variances, and the Total Sum of Squares (TSS) is the total variance of the entire region. Y<sub>m, i</sub> is the value of Y in the <italic>i</italic>th unit of layer m, and<inline-formula id="inf3">
<mml:math id="m12">
<mml:mrow>
<mml:mo>&#xa0;</mml:mo>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:msub>
<mml:mi>Y</mml:mi>
<mml:mi>m</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="true">&#xaf;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> is the average value of variable Y in layer m. <inline-formula id="inf4">
<mml:math id="m13">
<mml:mrow>
<mml:msub>
<mml:mi>Y</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the Y value&#x20;of the <italic>j</italic>th unit of the whole study area, and <inline-formula id="inf5">
<mml:math id="m14">
<mml:mrow>
<mml:mover accent="true">
<mml:mi>Y</mml:mi>
<mml:mo>&#xaf;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula> is the total average of the variable Y in the whole study area. The range of q is [0,&#x20;1].</p>
</sec>
<sec id="s4-4">
<title>10-Fold Cross Validation</title>
<p>10-fold cross validation, used to test the accuracy of the algorithm, is a common test method. The dataset was divided into ten parts, nine of which were used as training data and one as test data in&#x20;turn.</p>
<p>The correct rate (or error rate) is obtained for each test. The average accuracy over the 10 tests is used as the estimate of the accuracy of the algorithm. Generally, multiple 10-fold cross validations (for example, 10 repetitions of 10-fold cross validation) are needed, and the average over all repetitions is then taken as the estimate of the accuracy of the algorithm.</p>
</sec>
</sec>
<sec id="s5">
<title>Modeling Process</title>
<sec id="s5-1">
<title>Geospatial Database</title>
<p>The landslide&#x2019;s occurrence is affected by both the internal geographical environmental factors and external disturbance environmental factors (<xref ref-type="bibr" rid="B38">Tsangaratos et&#x20;al., 2017</xref>). The internal factors include topographic and geological conditions, while the external factors include human engineering activities, rainfall, and reservoir water level changes. Based on comprehensive consideration of various factors and the actual conditions of the study area, 22 factors were selected as the initial conditioning factors including topography (elevation, slope, degree of relief, aspect, slope position, landforms, curvature, profile curvature, plan curvature, terrain roughness index (TRI), topographic wetness index (TWI), sediment transport index (STI), and stream power index (SPI)), geology (lithology, distance from fault, and combination reclassification of the stratum dip direction and slope aspect (CRDS)), environmental conditions (normalized difference vegetation index (NDVI), distance from hydrographic net, annual average rainfall, and land cover), and human activities (distance from roads and POI kernel density). All the 22 conditioning factors mentioned above were used to create the geospatial database with GIS software (<xref ref-type="bibr" rid="B33">Sun et&#x20;al., 2021c</xref>).</p>
<p>Here, slope, degree of relief, aspect, slope position, landforms, curvature, profile curvature, plan curvature, terrain roughness index (TRI) (<xref ref-type="bibr" rid="B1">Althuwaynee et&#x20;al., 2014</xref>), topographic wetness index (TWI) (<xref ref-type="bibr" rid="B48">Yilmaz 2009</xref>; <xref ref-type="bibr" rid="B16">Hong et&#x20;al., 2016</xref>), sediment transport index (STI) (<xref ref-type="bibr" rid="B28">Pourghasemi et&#x20;al., 2012</xref>), and stream power index (SPI) (<xref ref-type="bibr" rid="B25">Moore and Wilson, 1992</xref>) were based on the processing of the DEM with 30&#xa0;m resolution. Lithology and faults were extracted from geological maps with scales of 1:50,000&#x2013;1:200,000. The distances from faults, hydrographic nets, and roads were generated after buffering the faults, river networks, and roads, respectively. The selection of buffer distance was based on field surveys, imagery resolution, and previous research (<xref ref-type="bibr" rid="B45">Xie et&#x20;al., 2018</xref>; <xref ref-type="bibr" rid="B36">Sun et&#x20;al., 2021a</xref>). CRDS (<xref ref-type="bibr" rid="B35">Sun et&#x20;al., 2021b</xref>) was generated by subtraction and reclassification of slope aspect and stratum dip direction. NDVI was calculated using Landsat 8 OLI data with a resolution of 30&#xa0;m. Annual average rainfall was generated by the spatial interpolation method from the original data. POI kernel density was generated by kernel density calculation of POI point data, which refers to any nongeographical meaningful points on the map (<xref ref-type="bibr" rid="B35">Sun et&#x20;al., 2021b</xref>).</p>
<p>Moreover, to reduce the disadvantageous effects on the model caused by data discretization, reclassification was performed for the 13 continuous variables, including elevation, slope, degree of relief, curvature, profile curvature, plan curvature, TRI, TWI, STI, SPI, NDVI, annual average rainfall, and POI kernel density. Here, based on research experience, the reclassification thresholds of each factor were first obtained by the natural breaks method and then slightly adjusted by counting the number of historical landslide points in each category, so as to agree with the actual situation as much as possible. The other nine factors, which were originally classified, could directly be processed. A classification scheme was established for each continuous factor. To sum up, a spatial database of landslide conditioning factors after reclassification was constructed in a 30&#xa0;m resolution grid cell. The thematic map of landslide influencing factors is shown in <xref ref-type="fig" rid="F3">Figure&#x20;3</xref>.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Thematic map of landslide influencing factors: <bold>(A)</bold> aspect; <bold>(B)</bold> CRDS; <bold>(C)</bold> curvature; <bold>(D)</bold> elevation; <bold>(E)</bold> distance from faults; <bold>(F)</bold> distance from hydrographic net; <bold>(G)</bold> landcover; <bold>(H)</bold> microlandform; <bold>(I)</bold> lithology; <bold>(J)</bold> NDVI; <bold>(K)</bold> plan curvature; <bold>(L)</bold> POI; <bold>(M)</bold> profile curvature; <bold>(N)</bold> relief; <bold>(O)</bold> annual average rainfall; <bold>(P)</bold> slope; <bold>(Q)</bold> slope position; <bold>(R)</bold> SPI; <bold>(S)</bold> STI; <bold>(T)</bold> TRI; <bold>(U)</bold> TWI; and <bold>(V)</bold> distance from&#x20;roads.</p>
</caption>
<graphic xlink:href="feart-09-713803-g003.tif"/>
</fig>
<p>To reduce the effect of factor data discreteness on the logistic regression model, all the 22 factors after reclassification were normalized to [0,1] by <xref ref-type="disp-formula" rid="e6">the</xref> following equation:<disp-formula id="e6">
<mml:math id="m22">
<mml:mrow>
<mml:msup>
<mml:mi>X</mml:mi>
<mml:mo>&#x2217;</mml:mo>
</mml:msup>
<mml:mo>&#x3d;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
</mml:mrow>
<mml:mi>X</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>/</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
</mml:mrow>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>x</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
<label>(6)</label>
</disp-formula>where <italic>X&#x2a;</italic> is the normalized data; <italic>X</italic> is the original data; <italic>X</italic>
<sub>min</sub> is the minimum value of data; and <italic>X</italic>
<sub>max</sub> is the maximum value of&#x20;data.</p>
</sec>
<sec id="s5-2">
<title>Preparation of the Sample Dataset</title>
<p>In the study, landslide cells (positive cells) and no-landslide cells (negative cells) made up all datasets. Landslide cells consisted of 1,522 historical landslide events, each of which was regarded as a single cell. Because of the geometric effect, all landslide cells were excluded by setting a 500&#xa0;m buffer zone for all the 1,522 landslide points, and the remaining areas were regarded as the no-landslide areas (<xref ref-type="bibr" rid="B45">Xie et&#x20;al., 2018</xref>). Researchers have different opinions on the ratio between landslide and no-landslide cells, but the most widely used ratios are 1:1, 1:5, and 1:10, and the last ratio of 1:10 was selected in this study after many experiments. A total of 15,220 no-landslide cells were randomly extracted from the no-landslide&#x20;area.</p>
</sec>
<sec id="s5-3">
<title>Model Optimization</title>
<sec id="s5-3-1">
<title>Dominant-Factor Screening and Preliminary Training</title>
<p>The process of preliminary training was as follows: according to a 7:3 ratio, all sample datasets were divided into a training dataset (11,720) and a test dataset (5,022). The training dataset was used for LR model training, and the test dataset was used for testing.</p>
<p>1) The stepwise regression method included in the LR: 22 initial conditioning factors were subjected to stepwise regression training of the LR<sub>a</sub> model (ordinary model). The conditioning factors were introduced into the equation one by one. All conditioning factors in the equation were tested one by one, and the insignificant conditioning factors were removed from the equation one by one. In the final equation, some conditioning factors that had a significant influence on the Y value of the landslide remained, and others that had no significant influence on the Y value of the landslide were omitted. Also, 11 factors were preliminarily selected by passing the test of the significance level of 0.05, which are topographic (elevation, degree of relief, slope, TRI, and SPI), geological conditions (lithology, distance from fault, and CRDS), environmental conditions (land cover), and human activities (distance from roads and POI kernel density).</p>
<p>2) The factor detection method of the GeoDetector: based on the R language, we used the GeoDetector to detect all datasets, including 22 initial conditioning factors. The results are shown in <xref ref-type="table" rid="T2">Table&#x20;2</xref>. The <italic>p</italic> value represents the significance level, and the q value represents the explanatory power of the factor, i.e.,&#x20;the influence degree of conditioning factors on the landslide. We found that SPI and STI failed the significance test (<italic>p</italic>&#x20;&#x3e; 0.05). Therefore, we eliminated these two nonsignificant and least explanatory factors directly. The remaining 20 factors passed the significance test (<italic>p</italic>&#x20;&#x3d; 0.000) and can be used in subsequent experiments.</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Factor detector results.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Conditioning factor</th>
<th align="center">q value</th>
<th align="center">
<italic>p</italic> value</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Annual average rainfall</td>
<td align="char" char=".">0.080</td>
<td align="char" char=".">0.000</td>
</tr>
<tr>
<td align="left">Elevation</td>
<td align="char" char=".">0.077</td>
<td align="char" char=".">0.000</td>
</tr>
<tr>
<td align="left">Lithology</td>
<td align="char" char=".">0.061</td>
<td align="char" char=".">0.000</td>
</tr>
<tr>
<td align="left">POI kernel density</td>
<td align="char" char=".">0.056</td>
<td align="char" char=".">0.000</td>
</tr>
<tr>
<td align="left">Distance from road</td>
<td align="char" char=".">0.029</td>
<td align="char" char=".">0.000</td>
</tr>
<tr>
<td align="left">Landcover</td>
<td align="char" char=".">0.022</td>
<td align="char" char=".">0.000</td>
</tr>
<tr>
<td align="left">Distance from hydrographic net</td>
<td align="char" char=".">0.013</td>
<td align="char" char=".">0.000</td>
</tr>
<tr>
<td align="left">Distance from fault</td>
<td align="char" char=".">0.010</td>
<td align="char" char=".">0.000</td>
</tr>
<tr>
<td align="left">Slope</td>
<td align="char" char=".">0.010</td>
<td align="char" char=".">0.000</td>
</tr>
<tr>
<td align="left">Degree of relief</td>
<td align="char" char=".">0.008</td>
<td align="char" char=".">0.000</td>
</tr>
<tr>
<td align="left">TRI</td>
<td align="char" char=".">0.006</td>
<td align="char" char=".">0.000</td>
</tr>
<tr>
<td align="left">TWI</td>
<td align="char" char=".">0.004</td>
<td align="char" char=".">0.000</td>
</tr>
<tr>
<td align="left">Plan curvature</td>
<td align="char" char=".">0.003</td>
<td align="char" char=".">0.000</td>
</tr>
<tr>
<td align="left">Curvature</td>
<td align="char" char=".">0.003</td>
<td align="char" char=".">0.000</td>
</tr>
<tr>
<td align="left">Landforms</td>
<td align="char" char=".">0.002</td>
<td align="char" char=".">0.000</td>
</tr>
<tr>
<td align="left">NDVI</td>
<td align="char" char=".">0.002</td>
<td align="char" char=".">0.000</td>
</tr>
<tr>
<td align="left">Profile curvature</td>
<td align="char" char=".">0.002</td>
<td align="char" char=".">0.000</td>
</tr>
<tr>
<td align="left">Aspect</td>
<td align="char" char=".">0.002</td>
<td align="char" char=".">0.000</td>
</tr>
<tr>
<td align="left">CRDS</td>
<td align="char" char=".">0.002</td>
<td align="char" char=".">0.000</td>
</tr>
<tr>
<td align="left">Slope position</td>
<td align="char" char=".">0.001</td>
<td align="char" char=".">0.000</td>
</tr>
<tr>
<td align="left">SPI</td>
<td align="char" char=".">0.000</td>
<td align="char" char=".">0.228</td>
</tr>
<tr>
<td align="left">STI</td>
<td align="char" char=".">0.000</td>
<td align="char" char=".">0.487</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>
<xref ref-type="fig" rid="F4">Figure&#x20;4</xref> shows the factor detection results of the significant factors in descending order of q value. In conjunction with <xref ref-type="table" rid="T2">Table&#x20;2</xref>, we found that the annual average rainfall and elevation were two important control factors for the spatial differentiation of Y values of landslides. Their q values (the explanatory power of the factors) were both greater than 0.075. The q values of the topographical conditions (except elevation), part of geological conditions (distance from fault, CRDS), and environmental conditions (NDVI) were less than or equal to 0.01. In <xref ref-type="fig" rid="F4">Figure&#x20;4</xref>, the slope of the curve from distance from fault onward is almost 0, which means that the last 13 factors (distance from fault and the 12 factors after it) explain the spatial differentiation of landslides very little and can be ignored and eliminated directly. Therefore, the seven dominant factors (annual average rainfall, elevation, lithology, POI kernel density, distance from road, land cover, and distance from hydrographic net) were selected and placed in the LR<sub>b</sub> model (the model optimized by the GeoDetector). Moreover, we used these seven factors for stepwise regression training included in LR. All factors were retained, which means the dominant factors screened by the GeoDetector had vast differences from each&#x20;other.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Factor detector results.</p>
</caption>
<graphic xlink:href="feart-09-713803-g004.tif"/>
</fig>
</sec>
<sec id="s5-3-2">
<title>Optimal Training Sample Based on 10-Fold Cross Validation</title>
<p>To reduce the influence of a single sampling on results, the 10-fold cross-validation method was used to select the training sample and test sample. The 10-fold cross-validation method divided the sample dataset (1,522 positive cells and 15,220 negative cells) randomly and evenly into ten disjoint subsets. One subset was used for testing each time, and the remaining subsets were used for model training.</p>
<p>Based on the R language, we built two LR models, one without and one with the GeoDetector (LR<sub>a</sub> did not use it and LR<sub>b</sub> used it). <xref ref-type="table" rid="T3">Table&#x20;3</xref> shows the accuracy of the 10-fold cross validation of the two models. The average accuracy of the training dataset and test dataset of the LR<sub>a</sub> model was 0.908 and 0.910, while the average accuracy of both the training dataset and test dataset of the LR<sub>b</sub> model was 0.910. Thus, from the average accuracy, we found that the model using the GeoDetector to screen dominant factors can maintain high accuracy and high stability. For the test dataset, the accuracy of sample No.1 (0.916) of the LR<sub>a</sub> model and sample No.4 (0.929) of the LR<sub>b</sub> model was the highest. Therefore, we decided to use the two samples as the optimal training samples to get the final models (LR<sub>ao</sub> and LR<sub>bo</sub>), which were based on dominant-factor screening and the optimal training samples.</p>
<table-wrap id="T3" position="float">
<label>TABLE 3</label>
<caption>
<p>The accuracy of 10-fold cross validation of the two models.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th rowspan="2" align="left">LR<sub>a</sub>
</th>
<th colspan="2" align="center">Accuracy</th>
<th rowspan="2" align="center">LR<sub>b</sub>
</th>
<th colspan="2" align="center">Accuracy</th>
</tr>
<tr>
<th align="center">Training dataset</th>
<th align="center">Test dataset</th>
<th align="center">Training dataset</th>
<th align="center">Test dataset</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">1</td>
<td align="char" char=".">0.908</td>
<td align="char" char=".">0.916</td>
<td align="center">1</td>
<td align="char" char=".">0.910</td>
<td align="char" char=".">0.899</td>
</tr>
<tr>
<td align="left">2</td>
<td align="char" char=".">0.909</td>
<td align="char" char=".">0.910</td>
<td align="center">2</td>
<td align="char" char=".">0.910</td>
<td align="char" char=".">0.904</td>
</tr>
<tr>
<td align="left">3</td>
<td align="char" char=".">0.909</td>
<td align="char" char=".">0.914</td>
<td align="center">3</td>
<td align="char" char=".">0.910</td>
<td align="char" char=".">0.907</td>
</tr>
<tr>
<td align="left">4</td>
<td align="char" char=".">0.909</td>
<td align="char" char=".">0.906</td>
<td align="center">4</td>
<td align="char" char=".">0.907</td>
<td align="char" char=".">0.929</td>
</tr>
<tr>
<td align="left">5</td>
<td align="char" char=".">0.909</td>
<td align="char" char=".">0.910</td>
<td align="center">5</td>
<td align="char" char=".">0.911</td>
<td align="char" char=".">0.900</td>
</tr>
<tr>
<td align="left">6</td>
<td align="char" char=".">0.910</td>
<td align="char" char=".">0.902</td>
<td align="center">6</td>
<td align="char" char=".">0.910</td>
<td align="char" char=".">0.906</td>
</tr>
<tr>
<td align="left">7</td>
<td align="char" char=".">0.909</td>
<td align="char" char=".">0.910</td>
<td align="center">7</td>
<td align="char" char=".">0.910</td>
<td align="char" char=".">0.903</td>
</tr>
<tr>
<td align="left">8</td>
<td align="char" char=".">0.909</td>
<td align="char" char=".">0.911</td>
<td align="center">8</td>
<td align="char" char=".">0.909</td>
<td align="char" char=".">0.916</td>
</tr>
<tr>
<td align="left">9</td>
<td align="char" char=".">0.909</td>
<td align="char" char=".">0.911</td>
<td align="center">9</td>
<td align="char" char=".">0.909</td>
<td align="char" char=".">0.914</td>
</tr>
<tr>
<td align="left">10</td>
<td align="char" char=".">0.899</td>
<td align="char" char=".">0.910</td>
<td align="center">10</td>
<td align="char" char=".">0.909</td>
<td align="char" char=".">0.918</td>
</tr>
<tr>
<td align="left">Mean</td>
<td align="char" char=".">0.908</td>
<td align="char" char=".">0.910</td>
<td align="center">Mean</td>
<td align="char" char=".">0.910</td>
<td align="char" char=".">0.910</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s5-3-3">
<title>Final Optimal Models</title>
<p>The two final models (LR<sub>ao</sub> and LR<sub>bo</sub>) were different. Specifically, the former is an LR model that only performed a stepwise regression on 22 initial conditioning factors to remove insignificant factors, while the latter used the GeoDetector to screen out seven dominant factors first and then performed stepwise regression. The correlation coefficients and function intercept values of the factors of the two final models are shown in <xref ref-type="table" rid="T4">Tables 4</xref>,&#x20;<xref ref-type="table" rid="T5">5</xref>.</p>
<table-wrap id="T4" position="float">
<label>TABLE 4</label>
<caption>
<p>The correlation coefficients and function intercept values of LR<sub>ao</sub>.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Influencing factor</th>
<th align="center">Correlation coefficient</th>
<th align="center">Influencing factor</th>
<th align="center">Correlation coefficient</th>
<th align="center">Influencing factor</th>
<th align="center">Correlation coefficient</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Intercept (&#x3b2;<sub>a</sub>)</td>
<td align="char" char=".">&#x2212;1.76293</td>
<td align="left">TRI (aw<sub>4</sub>)</td>
<td align="char" char=".">&#x2212;1.07045</td>
<td align="left">Land cover (aw<sub>8</sub>)</td>
<td align="char" char=".">&#x2212;0.66213</td>
</tr>
<tr>
<td align="left">Elevation (aw<sub>1</sub>)</td>
<td align="char" char=".">&#x2212;2.42323</td>
<td align="left">Lithology (aw<sub>5</sub>)</td>
<td align="char" char=".">&#x2212;3.24346</td>
<td align="left">Distance from road (aw<sub>9</sub>)</td>
<td align="char" char=".">&#x2212;1.08878</td>
</tr>
<tr>
<td align="left">Degree of relief (aw<sub>2</sub>)</td>
<td align="char" char=".">&#x2212;1.91424</td>
<td align="left">Distance from fault (aw<sub>6</sub>)</td>
<td align="char" char=".">1.51187</td>
<td align="left">POI kernel density (aw<sub>10</sub>)</td>
<td align="char" char=".">1.54395</td>
</tr>
<tr>
<td align="left">Slope (aw<sub>3</sub>)</td>
<td align="char" char=".">2.59564</td>
<td align="left">CRDS (aw<sub>7</sub>)</td>
<td align="char" char=".">&#x2212;0.45871</td>
<td align="left">&#x2014;</td>
<td align="center">&#x2014;</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap id="T5" position="float">
<label>TABLE 5</label>
<caption>
<p>The correlation coefficients and function intercept values of LR<sub>bo</sub>.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Influencing factor</th>
<th align="center">Correlation coefficient</th>
<th align="center">Influencing factor</th>
<th align="center">Correlation coefficient</th>
<th align="center">Influencing factor</th>
<th align="center">Correlation coefficient</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Intercept (&#x3b2;<sub>b</sub>)</td>
<td align="char" char=".">&#x2212;0.11216</td>
<td align="left">Lithology (bw<sub>3</sub>)</td>
<td align="char" char=".">&#x2212;3.51706</td>
<td align="left">Land cover (bw<sub>6</sub>)</td>
<td align="char" char=".">&#x2212;0.89108</td>
</tr>
<tr>
<td align="left">Annual average rainfall (bw<sub>1</sub>)</td>
<td align="char" char=".">&#x2212;0.95321</td>
<td align="left">POI kernel density (bw<sub>4</sub>)</td>
<td align="char" char=".">1.57236</td>
<td align="left">Distance from hydrographic net (bw<sub>7</sub>)</td>
<td align="char" char=".">0.20805</td>
</tr>
<tr>
<td align="left">Elevation (bw<sub>2</sub>)</td>
<td align="char" char=".">&#x2212;1.67349</td>
<td align="left">Distance from road (bw<sub>5</sub>)</td>
<td align="char" char=".">&#x2212;1.08721</td>
<td align="left">&#x2014;</td>
<td align="center">&#x2014;</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Finally, the two linear models are shown as follows:<disp-formula id="e7">
<mml:math id="m16">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="normal">Z</mml:mi>
<mml:mi mathvariant="normal">a</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1.76293</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>2.42323</mml:mn>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:msub>
<mml:mi mathvariant="normal">w</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1.91424</mml:mn>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:msub>
<mml:mi mathvariant="normal">w</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>2.59564</mml:mn>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:msub>
<mml:mi mathvariant="normal">w</mml:mi>
<mml:mn>3</mml:mn>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1.07045</mml:mn>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:msub>
<mml:mi mathvariant="normal">w</mml:mi>
<mml:mn>4</mml:mn>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>3.24346</mml:mn>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:msub>
<mml:mi mathvariant="normal">w</mml:mi>
<mml:mn>5</mml:mn>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1.51187</mml:mn>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:msub>
<mml:mi mathvariant="normal">w</mml:mi>
<mml:mn>6</mml:mn>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>0.45871</mml:mn>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:msub>
<mml:mi mathvariant="normal">w</mml:mi>
<mml:mn>7</mml:mn>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>0.66213</mml:mn>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:msub>
<mml:mi mathvariant="normal">w</mml:mi>
<mml:mn>8</mml:mn>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1.08878</mml:mn>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:msub>
<mml:mi mathvariant="normal">w</mml:mi>
<mml:mn>9</mml:mn>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1.54395</mml:mn>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:msub>
<mml:mi mathvariant="normal">w</mml:mi>
<mml:mrow>
<mml:mn>10</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
<label>(7)</label>
</disp-formula>
<disp-formula id="e8">
<mml:math id="m17">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="normal">Z</mml:mi>
<mml:mi mathvariant="normal">b</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>0.11216</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>0.95321</mml:mn>
<mml:mi mathvariant="normal">b</mml:mi>
<mml:msub>
<mml:mi mathvariant="normal">w</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1.67349</mml:mn>
<mml:mi mathvariant="normal">b</mml:mi>
<mml:msub>
<mml:mi mathvariant="normal">w</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>3.51706</mml:mn>
<mml:mi mathvariant="normal">b</mml:mi>
<mml:msub>
<mml:mi mathvariant="normal">w</mml:mi>
<mml:mn>3</mml:mn>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>1.57236</mml:mn>
<mml:mi mathvariant="normal">b</mml:mi>
<mml:msub>
<mml:mi mathvariant="normal">w</mml:mi>
<mml:mn>4</mml:mn>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1.08721</mml:mn>
<mml:mi mathvariant="normal">b</mml:mi>
<mml:msub>
<mml:mi mathvariant="normal">w</mml:mi>
<mml:mn>5</mml:mn>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>0.89108</mml:mn>
<mml:mi mathvariant="normal">b</mml:mi>
<mml:msub>
<mml:mi mathvariant="normal">w</mml:mi>
<mml:mn>6</mml:mn>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:mn>0.20805</mml:mn>
<mml:mi mathvariant="normal">b</mml:mi>
<mml:msub>
<mml:mi mathvariant="normal">w</mml:mi>
<mml:mn>7</mml:mn>
</mml:msub>
</mml:mrow>
</mml:math>
<label>(8)</label>
</disp-formula>
</p>
</sec>
</sec>
<sec id="s5-4">
<title>Model Performance and Validation</title>
<p>Any landslide susceptibility assessment will have no scientific significance without validation, so it is necessary to evaluate the validity of the models used. Landslide susceptibility prediction is a typical binary classification problem, and the confusion matrix can be used to analyze the accuracy further. Instances are divided into positive and negative categories. That is to say, if the sample point is a landslide, it is positive, and if the sample point is a nonlandslide, it is negative. Four situations can occur in the results: 1) an instance status is &#x201c;landslide&#x201d; and is also predicted as &#x201c;landslide,&#x201d; recorded as True Positive (TP); 2) an instance status is &#x201c;nonlandslide&#x201d; but is predicted as &#x201c;landslide,&#x201d; recorded as False Positive (FP); 3) an instance status is &#x201c;nonlandslide&#x201d; and is predicted as &#x201c;nonlandslide,&#x201d; recorded as True Negative (TN); and 4) an instance status is &#x201c;landslide&#x201d; but is predicted as &#x201c;nonlandslide,&#x201d; recorded as False Negative (FN). Furthermore, we used the &#x201c;OptimalCutoff&#x201d; function of the &#x201c;InformationValue&#x201d; package of R language to find the optimal threshold for partitioning the prediction results of the model. If the predicted value is greater than the threshold, a landslide will occur. Otherwise, the landslide will not&#x20;occur.</p>
<p>Based on the confusion matrix, Receiver Operating Characteristic (ROC) curves and Area Under the Curve (AUC) values are commonly used to comprehensively test and evaluate model accuracy (<xref ref-type="bibr" rid="B53">Naghibi and Moradi Dashtpagerdi, 2016</xref>). When the AUC value is greater than 0.5, the closer it is to 1, the higher the accuracy of the model prediction.</p>
</sec>
</sec>
<sec sec-type="results" id="s6">
<title>Results</title>
<sec id="s6-1">
<title>Comparison of Models</title>
<p>The optimal thresholds of the LR<sub>ao</sub> and LR<sub>bo</sub> models were very similar, at 0.534 and 0.592, respectively (<xref ref-type="table" rid="T6">Table&#x20;6</xref>). The accuracy, precision, and recall of the LR<sub>ao</sub> and the LR<sub>bo</sub> were almost the same. The total accuracy of the two models had little difference, which was 0.911 and 0.910, respectively. Nevertheless, the precision for landslide and nonlandslide of the LR<sub>ao</sub> model (nonlandslide: 0.914; landslide 0.611) was slightly higher than that of the LR<sub>bo</sub> model (nonlandslide: 0.911; landslide 0.595). The two models had extremely high recall rates for nonlandslide, and the LR<sub>ao</sub> (0.996) is slightly lower than the LR<sub>bo</sub> (0.998). However, for landslides, the recall rate was lower, and the LR<sub>ao</sub> (0.065) was slightly higher than the LR<sub>bo</sub> (0.031). The difference between the two models was insignificant, and both had exceptional reliability.</p>
<table-wrap id="T6" position="float">
<label>TABLE 6</label>
<caption>
<p>Confusion matrix between observed and predicted values under optimal threshold conditions for LR<sub>ao</sub> and LR<sub>bo</sub> models.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th rowspan="2" align="left">Model</th>
<th rowspan="2" align="center">Threshold</th>
<th rowspan="2" align="left"/>
<th rowspan="2" align="left"/>
<th colspan="2" align="center">Actual value</th>
<th rowspan="2" align="left"/>
</tr>
<tr>
<th align="center">Nonlandslide (0)</th>
<th align="center">Landslide (1)</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td rowspan="3" align="left">LR<sub>ao</sub>
</td>
<td rowspan="3" align="char" char=".">0.534</td>
<td rowspan="3" align="left">Predicted value</td>
<td align="left">Nonlandslide (0)</td>
<td align="center">15,157</td>
<td align="center">1,423</td>
<td align="left">Precision: 0.914</td>
</tr>
<tr>
<td align="left">Landslide (1)</td>
<td align="center">63</td>
<td align="center">99</td>
<td align="left">Precision: 0.611</td>
</tr>
<tr>
<td align="left">&#x2014;</td>
<td align="center">Recall: 0.996</td>
<td align="center">Recall: 0.065</td>
<td align="left">Accuracy: 0.911</td>
</tr>
<tr>
<td rowspan="3" align="left">LR<sub>bo</sub>
</td>
<td rowspan="3" align="char" char=".">0.592</td>
<td rowspan="3" align="left">Predicted value</td>
<td align="left">Nonlandslide (0)</td>
<td align="center">15,188</td>
<td align="center">1,475</td>
<td align="left">Precision: 0.911</td>
</tr>
<tr>
<td align="left">Landslide (1)</td>
<td align="center">32</td>
<td align="center">47</td>
<td align="left">Precision: 0.595</td>
</tr>
<tr>
<td align="left">&#x2014;</td>
<td align="center">Recall: 0.998</td>
<td align="center">Recall: 0.031</td>
<td align="left">Accuracy: 0.910</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The AUC values of the ROC curves of the two models were 0.843 and 0.835 for the training dataset, 0.834 and 0.840 for the test dataset, and 0.842 and 0.835 for all datasets (<xref ref-type="fig" rid="F5">Figure&#x20;5</xref>), indicating that the LR model before and after optimization in this study both had high reliability and good prediction ability.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>ROC curve of the LR<sub>ao</sub> and the LR<sub>bo</sub> models.</p>
</caption>
<graphic xlink:href="feart-09-713803-g005.tif"/>
</fig>
</sec>
<sec id="s6-2">
<title>Validity of the Optimized Model</title>
<p>Compared with the LR<sub>ao</sub>, the LR<sub>bo</sub> (the optimized model) had absolute stability and high accuracy. So, we applied the LR<sub>bo</sub> to the entire case study area for LSM. Expert empirical methods and dynamic setting threshold methods were used to select the appropriate division-level threshold. The selection of the optimal threshold should minimize the density of historical landslides in the low-susceptibility region and maximize the density of historical landslides in the high-susceptibility region. After repeated trials and errors, five susceptibility levels were finally divided (very-low&#x2013;susceptibility region with <italic>P</italic>&#x20;&#x3c; 0.05 vs. low-susceptibility region with 0.05 &#x2264; <italic>P</italic> &#x3c; 0.10 vs. moderate-susceptibility region with 0.10 &#x2264; <italic>P</italic> &#x3c; 0.17 vs. high-susceptibility region with 0.17 &#x2264; <italic>P</italic> &#x3c; 0.28 vs. very-high&#x2013;susceptibility region with <italic>P</italic> &#x2265; 0.28) (<xref ref-type="fig" rid="F6">Figure&#x20;6</xref>). It shows the very-low&#x2013; and low-susceptibility regions were concentrated in the south and southeast of Fengjie County. Meanwhile, the high- and very-high&#x2013;susceptibility regions, which agreed with the geospatial distribution of the historical landslides, were concentrated on both sides of the Yangtze River and its tributaries, mainly in the northern and central parts of Fengjie County.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>Landslide susceptibility mapping based on the LR<sub>bo</sub> model vs. the geospatial distribution of historical landslides.</p>
</caption>
<graphic xlink:href="feart-09-713803-g006.tif"/>
</fig>
<p>
<xref ref-type="table" rid="T7">Table&#x20;7</xref> is the statistical result of landslide susceptibility at different levels. The proportion of historical landslides increased gradually with the increase of the susceptibility level, and the density of landslides was positively correlated with the susceptibility level. The area of very-low&#x2013; and low-susceptibility regions accounted for 65.43% of the total area of the study area, while the number of historical landslides only accounted for 23.85% of the total landslides; the area of very-high&#x2013; and high-susceptibility regions accounted for 20.51% of the total area, while the number of historical landslides accounted for 57.42% of the total landslides. This also shows the geospatial agreement between the high-susceptibility regions and the historical landslides.</p>
<table-wrap id="T7" position="float">
<label>TABLE 7</label>
<caption>
<p>Statistical results of landslide susceptibility in different levels.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Susceptibility level</th>
<th align="center">Cells number</th>
<th align="center">Area proportion/%</th>
<th align="center">Landslide</th>
<th align="center">Landslide proportion/%</th>
<th align="center">Density proportion</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Very low</td>
<td align="char" char=".">2090557</td>
<td align="char" char=".">46.39</td>
<td align="char" char=".">128</td>
<td align="char" char=".">8.41</td>
<td align="char" char=".">0.07</td>
</tr>
<tr>
<td align="left">Low</td>
<td align="char" char=".">858067</td>
<td align="char" char=".">19.04</td>
<td align="char" char=".">235</td>
<td align="char" char=".">15.44</td>
<td align="char" char=".">0.30</td>
</tr>
<tr>
<td align="left">Moderate</td>
<td align="char" char=".">634007</td>
<td align="char" char=".">14.07</td>
<td align="char" char=".">285</td>
<td align="char" char=".">18.73</td>
<td align="char" char=".">0.50</td>
</tr>
<tr>
<td align="left">High</td>
<td align="char" char=".">470363</td>
<td align="char" char=".">10.44</td>
<td align="char" char=".">351</td>
<td align="char" char=".">23.06</td>
<td align="char" char=".">0.83</td>
</tr>
<tr>
<td align="left">Very high</td>
<td align="char" char=".">453653</td>
<td align="char" char=".">10.07</td>
<td align="char" char=".">523</td>
<td align="char" char=".">34.36</td>
<td align="char" char=".">1.28</td>
</tr>
<tr>
<td align="left">Statistics</td>
<td align="char" char=".">4506647</td>
<td align="char" char=".">100.00</td>
<td align="char" char=".">1522</td>
<td align="char" char=".">100.00</td>
<td align="center">&#x2014;</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s6-3">
<title>Distribution Characteristics of New Landslide Events</title>
<p>The historical landslide data used in this study were from 2001 to 2016. To verify the LSM results further, we also collected data on 61 new landslides that occurred in the study area in 2017. All the new landslides were triggered by rainfall, which indicates that rainfall is the main landslide-inducing factor in this study area. The geospatial distribution of the new landslides was overlaid on the LSM (<xref ref-type="fig" rid="F7">Figure&#x20;7</xref>), and Table&#x20;7 shows the details of all the new landslide events, including the susceptibility level at their locations. In general, 65% of the new landslide events were located in the high- and very-high&#x2013;susceptibility regions, and 10% were in the moderate-susceptibility region. For case study purposes, we analyzed three typical landslides: the Qulongxiaoxue landslide, the Sujiawan landslide, and the Tianjiadawu landslide. The Qulongxiaoxue landslide was a medium-sized landslide, which was the largest of all new landslides, covering an affected area of 28.179&#xa0;m<sup>2</sup>. Although the area and volume of the Sujiawan landslide were not significant, it ranked second in both the number of people affected and the number of threats. The Tianjiadawu landslide was a medium-sized landslide that occurred in northwestern Fengjie County in October 2017. These three landslides were located in the high-susceptibility region, indicating that the LSM has a good geospatial agreement with the actual landslide events and that the model had a good prediction ability.</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption>
<p>Landslide susceptibility mapping based on the LR<sub>bo</sub> model vs. the geospatial distribution of new landslides.</p>
</caption>
<graphic xlink:href="feart-09-713803-g007.tif"/>
</fig>
</sec>
</sec>
<sec sec-type="discussion" id="s7">
<title>Discussion</title>
<p>Comparing the results of factor screening of the two models (<xref ref-type="fig" rid="F8">Figure&#x20;8</xref>), there are 10 main factors retained by the LR<sub>ao</sub> model after stepwise regression. However, there are seven main factors retained by the LR<sub>bo</sub> model after GeoDetector and stepwise regression. Through comparative analysis, it is found that the main factors retained by both the LR<sub>ao</sub> model and the LR<sub>bo</sub> model include elevation, lithology, land cover, distance from roads, and POI kernel density. Among them, elevation and lithology represent the predisposing factors of landslides, which largely determine the stability of local slopes (<xref ref-type="bibr" rid="B31">Sivakumar and Ghosh, 2021</xref>; <xref ref-type="bibr" rid="B37">Tang et&#x20;al., 2021</xref>). In the same way, the materials covering the ground affect slope-surface processes, such as runoff and the accumulation of materials on the slope surface. Distance from roads and POI kernel density represent trigger factors caused by human activities. These two factors change the natural stress on an originally stable slope, causing cracks inside the slope and eventually leading to landslides. Therefore, the dominant factors selected by stepwise regression and GeoDetector are quite reasonable and can serve as a reference.</p>
<fig id="F8" position="float">
<label>FIGURE 8</label>
<caption>
<p>Ranking chart of the absolute value of the correlation coefficient of conditioning factors: <bold>(A)</bold> LR<sub>ao</sub> model; <bold>(B)</bold> LR<sub>bo</sub> model.</p>
</caption>
<graphic xlink:href="feart-09-713803-g008.tif"/>
</fig>
<p>In addition to the five common factors, the LR<sub>ao</sub> model also retains another five main influencing factors: the degree of relief, slope, TRI, distance from the fault, and CRDS. These factors are all related to the incubation conditions of the landslide and describe the development environment of the landslide itself. Besides the five common factors, two further main conditioning factors remain in the LR<sub>bo</sub> model: the distance from the hydrographic net and annual average rainfall. In river valleys, high and steep slopes are usually formed under the erosion action of water currents, where the resistance ability of the slopes will be further reduced. Rainfall is one of the factors affecting and controlling landslides that cannot be ignored. Judging from the causes of many landslides throughout the world (<xref ref-type="bibr" rid="B12">Fan et&#x20;al., 2020</xref>; <xref ref-type="bibr" rid="B47">Yang et&#x20;al., 2020</xref>; <xref ref-type="bibr" rid="B40">Van Tien et&#x20;al., 2021a</xref>; <xref ref-type="bibr" rid="B39">Van Tien et&#x20;al., 2021</xref>), the LR<sub>bo</sub> model retains some important trigger factors which are not retained by the LR<sub>ao</sub> model. Although the relationship between landslides and faults cannot be ignored (<xref ref-type="bibr" rid="B41">Wang et&#x20;al., 2021</xref>), most landslides are induced by rainfall in the study area, which does not have a strong relationship with faults. So, it is better not to retain the fault factor. Taken together, the explanatory power of the dominant factors retained by the LR<sub>ao</sub> model is not as strong as that of the factors retained by the LR<sub>bo</sub> model. The LR<sub>bo</sub> model eliminates unreasonable factors based on the LR<sub>ao</sub> model and retains the more dominant factors.</p>
<p>From the factor screening results of the LR<sub>bo</sub> model, four aspects have an important influence on the landslide, including topography, geological conditions, environmental conditions, and human activities. There are dominant factors in these four aspects, so in future research, these dominant factors can be considered as the research focus, while nondominant factors can be selectively excluded from the factor framework to reduce the workload. Meanwhile, there is an interaction between factors, which may increase or weaken the impact of a single factor on landslides. For example, if a slope is composed of permeable rock and impermeable rock, a water barrier will form naturally, and under the action of rainfall, the probability of landslide will be much higher than that of a slope composed of a single lithology. Therefore, the interaction between factors will be further studied in the follow-up&#x20;work.</p>
</sec>
<sec sec-type="conclusion" id="s8">
<title>Conclusion</title>
<p>In this study, by taking a typical landslide-prone area as an example of application analysis, an optimized LR-based LSM model was proposed by using comprehensive methods of the GeoDetector, stepwise regression, and 10-fold cross validation, which improved the geospatial agreement between landslide susceptibility and actual landslide-prone areas.<list list-type="simple">
<list-item>
<p>1) The confusion-matrix accuracies of the two models (LR<sub>ao</sub> and LR<sub>bo</sub>), based on dominant-factor screening and optimal training samples, were both more than 0.9. The AUC values of the ROC curves were significantly more than 0.8. The models had great prediction ability and high reliability whether tested before or after factor screening.</p>
</list-item>
<list-item>
<p>2) The LR<sub>bo</sub> model based on the GeoDetector screening factor used only seven dominant factors but achieved the same prediction accuracy as the LR<sub>ao</sub> model constructed with 20 factors. Moreover, its conditioning factors were more reasonable and stable than those of the LR<sub>ao</sub> model. Based on the optimized LR model, the LSM in this study was in good agreement with the spatial distribution of historical landslides. Most of the new landslides in 2017 were in high-susceptibility regions. All of these results show that the method proposed in this study using the GeoDetector, stepwise regression, and 10-fold cross validation is feasible and reliable.</p>
</list-item>
<list-item>
<p>3) The seven dominant factors, including elevation, lithology, distance from hydrographic net, annual average rainfall, land cover, distance from roads, and POI kernel density, covered four types of conditions of topographical, geological, environmental, and human activities, screened from 22 initial factors by the GeoDetector, indicating that each type has at least one dominant factor, which is more important than other factors of the same&#x20;type.</p>
</list-item>
</list>
</p>
</sec>
</body>
<back>
<sec id="s9">
<title>Data Availability Statement</title>
<p>The raw data supporting the conclusion of this article will be made available by the authors, without undue reservation.</p>
</sec>
<sec id="s10">
<title>Author Contributions</title>
<p>This paper represents a result of collaborative teamwork. HW conceived the method, designed and conducted the test and analysis, and reviewed and edited the manuscript; DS wrote the manuscript and conducted the test analysis; and JX and DW wrote the manuscript. YZ and JZ collected data and participated in the analysis. All authors gave final approval for publication.</p>
</sec>
<sec id="s11">
<title>Funding</title>
<p>This work was supported by the National Key Research and Development Program of China (Grant No. 2018YFC1505501) and the Fundamental Research Funds for the Central Universities (Grant No. 2021CDJKYJH036).</p>
</sec>
<sec sec-type="COI-statement" id="s12">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s13" sec-type="disclaimer">
<title>Publisher&#x2019;s Note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations or those of the publisher, the editors, and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ack>
<p>The authors would like to express their gratitude to the Chongqing Meteorological Administration and the Chongqing Institute of Geology and Mineral Resources for offering valuable research&#x20;data.</p>
</ack>
<ref-list>
<title>References</title>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Abedi Gheshlaghi</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Feizizadeh</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>GIS-Based Ensemble Modelling of Fuzzy System and Bivariate Statistics as a Tool to Improve the Accuracy of Landslide Susceptibility Mapping</article-title>. <source>Nat. Hazards</source> <volume>107</volume>, <fpage>1981</fpage>&#x2013;<lpage>2014</lpage>.</citation>
</ref>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Althuwaynee</surname>
<given-names>O. F.</given-names>
</name>
<name>
<surname>Pradhan</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Park</surname>
<given-names>H.-J.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>J.&#x20;H.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>A novel ensemble bivariate statistical evidential belief function with knowledge-based analytical hierarchy process and multivariate statistical logistic regression for landslide susceptibility mapping</article-title>. <source>Catena</source> <volume>114</volume>, <fpage>21</fpage>&#x2013;<lpage>36</lpage>. <pub-id pub-id-type="doi">10.1016/j.catena.2013.10.011</pub-id> </citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ayalew</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Yamagishi</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>The application of GIS-based logistic regression for landslide susceptibility mapping in the Kakuda-Yahiko Mountains, Central Japan</article-title>. <source>Geomorphology</source> <volume>65</volume>, <fpage>15</fpage>&#x2013;<lpage>31</lpage>. <pub-id pub-id-type="doi">10.1016/j.geomorph.2004.06.010</pub-id> </citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bourenane</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Bouhadad</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Guettouche</surname>
<given-names>M. S.</given-names>
</name>
<name>
<surname>Braham</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>GIS-based landslide susceptibility zonation using bivariate statistical and expert approaches in the city of Constantine (Northeast Algeria)</article-title>. <source>Bull. Eng. Geol. Environ.</source> <volume>74</volume>, <fpage>337</fpage>&#x2013;<lpage>355</lpage>. <pub-id pub-id-type="doi">10.1007/s10064-014-0616-6</pub-id> </citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chi</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Qian</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Sheng</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Xi</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Analysis of Differences in the Spatial Distribution among Terrestrial Mammals Using Geodetector&#x2014;A Case Study of China</article-title>. <source>ISPRS Int. J. Geo-Inf.</source> <volume>10</volume>, <fpage>21</fpage>. <pub-id pub-id-type="doi">10.3390/ijgi10010021</pub-id> </citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fan</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Tang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Tian</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Rainfall-induced rapid and long-runout catastrophic landslide on July 23, 2019 in Shuicheng, Guizhou, China</article-title>. <source>Landslides</source> <volume>17</volume>, <fpage>2161</fpage>&#x2013;<lpage>2171</lpage>. <pub-id pub-id-type="doi">10.1007/s10346-020-01454-y</pub-id> </citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Feby</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Achu</surname>
<given-names>A. L.</given-names>
</name>
<name>
<surname>Jimnisha</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Ayisha</surname>
<given-names>V. A.</given-names>
</name>
<name>
<surname>Reghunath</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Landslide susceptibility modelling using integrated evidential belief function based logistic regression method: A study from Southern Western Ghats, India</article-title>. <source>Remote Sensing Appl. Soc. Environ.</source> <volume>20</volume>, <fpage>100411</fpage>. </citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Feizizadeh</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Shadman Roodposhti</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Jankowski</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Blaschke</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>A GIS-Based Extended Fuzzy Multi-Criteria Evaluation for Landslide Susceptibility Mapping</article-title>. <source>Comput. Geosci.</source> <volume>73</volume>, <fpage>208</fpage>&#x2013;<lpage>221</lpage>.</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gautam</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Kubota</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Sapkota</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Shinohara</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Landslide susceptibility mapping with GIS in high mountain area of Nepal: a comparison of four methods</article-title>. <source>Environ. Earth Sci.</source> <volume>80</volume>, <fpage>359</fpage>&#x2013;<lpage>377</lpage>. <pub-id pub-id-type="doi">10.1007/s12665-021-09650-2</pub-id> </citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hong</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Naghibi</surname>
<given-names>S. A.</given-names>
</name>
<name>
<surname>Pourghasemi</surname>
<given-names>H. R.</given-names>
</name>
<name>
<surname>Pradhan</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>GIS-based landslide spatial modeling in Ganzhou city, China</article-title>. <source>Arab J.&#x20;Geosci.</source> <volume>9</volume> (<issue>2</issue>), <fpage>1</fpage>&#x2013;<lpage>26</lpage>. <pub-id pub-id-type="doi">10.1007/s12517-015-2094-y</pub-id> </citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Cao</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>S.-H.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Landslide susceptibility prediction based on a semi-supervised multiple-layer perceptron model</article-title>. <source>Landslides</source> <volume>17</volume>, <fpage>2919</fpage>&#x2013;<lpage>2930</lpage>. <pub-id pub-id-type="doi">10.1007/s10346-020-01473-9</pub-id> </citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huangfu</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Lin</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Landslide Geo-Hazard Risk Mapping Using Logistic Regression Modeling in Guixi, Jiangxi, China</article-title>. <source>Sustainability</source> <volume>13</volume>, <fpage>4830</fpage>. <pub-id pub-id-type="doi">10.3390/su13094830</pub-id> </citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kalantar</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Pradhan</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Naghibi</surname>
<given-names>S. A.</given-names>
</name>
<name>
<surname>Motevalli</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Mansor</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Assessment of the effects of training data selection on the landslide susceptibility mapping: a comparison between support vector machine (SVM), logistic regression (LR) and artificial neural networks (ANN)</article-title>. <source>Geomatics, Nat. Hazards Risk</source> <volume>9</volume> (<issue>1</issue>), <fpage>49</fpage>&#x2013;<lpage>69</lpage>. <pub-id pub-id-type="doi">10.1080/19475705.2017.1407368</pub-id> </citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Yan</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Cao</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Landslide Susceptibility Prediction Using Particle-Swarm-Optimized Multilayer Perceptron: Comparisons with Multilayer-Perceptron-Only, BP Neural Network, and Information Value Models</article-title>. <source>Appl. Sci.</source> <volume>9</volume>, <fpage>3664</fpage>. <pub-id pub-id-type="doi">10.3390/app9183664</pub-id> </citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Luo</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>C.-C.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Innovative landslide susceptibility mapping supported by geomorphon and geographical detector methods</article-title>. <source>Landslides</source> <volume>15</volume>, <fpage>465</fpage>&#x2013;<lpage>474</lpage>. <pub-id pub-id-type="doi">10.1007/s10346-017-0893-9</pub-id> </citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ma</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Applicability of Two Newmark Models in the Assessment of Coseismic Landslide Hazard and Estimation of Slope-Failure Probability: An Example of the 2008 Wenchuan Mw 7.9 Earthquake Affected Area</article-title>. <source>J.&#x20;Earth Sci.</source> <volume>30</volume>, <fpage>1020</fpage>&#x2013;<lpage>1030</lpage>. <pub-id pub-id-type="doi">10.1007/s12583-019-0874-0</pub-id> </citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Moore</surname>
<given-names>I. D.</given-names>
</name>
<name>
<surname>Wilson</surname>
<given-names>J.&#x20;P.</given-names>
</name>
</person-group> (<year>1992</year>). <article-title>Length-slope factors for the revised universal soil loss equation: simplified method of estimation</article-title>. <source>J.&#x20;Soil Water Conserv</source> <volume>47</volume> (<issue>5</issue>), <fpage>423</fpage>&#x2013;<lpage>428</lpage>. </citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Morales</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Lizama</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Somos-Valenzuela</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Lillio</surname>
<given-names>M. F.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>A comparative machine learning approach to identify landslide triggering factors in northern Chilean Patagonia</article-title>. <source>Landslides</source> <volume>18</volume>, <fpage>2767</fpage>&#x2013;<lpage>2784</lpage>. <pub-id pub-id-type="doi">10.1007/s10346-021-01675-9</pub-id> </citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Naemitabar</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Zanganeh Asadi</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Landslide zonation and assessment of Farizi watershed in northeastern Iran using data mining techniques</article-title>. <source>Nat. Hazards</source> <volume>108</volume>, <fpage>2423</fpage>&#x2013;<lpage>2453</lpage>. <pub-id pub-id-type="doi">10.1007/s11069-021-04805-7</pub-id> </citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Naghibi</surname>
<given-names>S. A.</given-names>
</name>
<name>
<surname>Dashtpagerdi</surname>
<given-names>M. M.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Evaluation of Four Supervised Learning Methods for Groundwater Spring Potential Mapping in Khalkhal Region (Iran) Using GIS-Based Features</article-title>. <source>Hydrogeol. J.</source> <volume>25</volume> (<issue>1</issue>), <fpage>169</fpage>&#x2013;<lpage>189</lpage>.</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pourghasemi</surname>
<given-names>H. R.</given-names>
</name>
<name>
<surname>Mohammady</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Pradhan</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Landslide susceptibility mapping using index of entropy and conditional probability models in GIS: Safarood Basin, Iran</article-title>. <source>Catena</source> <volume>97</volume>, <fpage>71</fpage>&#x2013;<lpage>84</lpage>. <pub-id pub-id-type="doi">10.1016/j.catena.2012.05.005</pub-id> </citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Reichenbach</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Rossi</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Malamud</surname>
<given-names>B. D.</given-names>
</name>
<name>
<surname>Mihir</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Guzzetti</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>A review of statistically-based landslide susceptibility models</article-title>. <source>Earth-Science Rev.</source> <volume>180</volume>, <fpage>60</fpage>&#x2013;<lpage>91</lpage>. <pub-id pub-id-type="doi">10.1016/j.earscirev.2018.03.001</pub-id> </citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shan</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Zhong</surname>
<given-names>Q.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Rapid prediction of landslide dam stability using the logistic regression method</article-title>. <source>Landslides</source> <volume>17</volume>, <fpage>2931</fpage>&#x2013;<lpage>2956</lpage>. <pub-id pub-id-type="doi">10.1007/s10346-020-01414-6</pub-id> </citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sivakumar</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Ghosh</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Assessment of the influence of physical and seismotectonic parameters on landslide occurrence: an integrated geoinformatic approach</article-title>. <source>Nat. Hazards</source> <volume>108</volume>, <fpage>2765</fpage>&#x2013;<lpage>2811</lpage>. <pub-id pub-id-type="doi">10.1007/s11069-021-04800-y</pub-id> </citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Soma</surname>
<given-names>A. S.</given-names>
</name>
<name>
<surname>Kubota</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Aditian</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Comparative Study of Land Use Change and Landslide Susceptibility Using Frequency Ratio, Certainty Factor, and Logistic Regression in Upper Area of Ujung-Loe Watersheds South Sulawesi Indonesia</article-title>. <source>Int. J. Erosion Control Eng.</source> <volume>11</volume>, <fpage>103</fpage>&#x2013;<lpage>115</lpage>. <pub-id pub-id-type="doi">10.13101/ijece.11.103</pub-id> </citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Shi</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Wen</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2021c</year>). <article-title>A hybrid optimization method of factor screening predicated on GeoDetector and Random Forest for Landslide Susceptibility Mapping</article-title>. <source>Geomorphology</source> <volume>379</volume>, <fpage>107623</fpage>. <pub-id pub-id-type="doi">10.1016/j.geomorph.2021.107623</pub-id> </citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Wen</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Xue</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2021b</year>). <article-title>An optimal sample selection-based logistic regression model of slope physical resistance against rainfall-induced landslide</article-title>. <source>Nat. Hazards</source> <volume>105</volume> (<issue>2</issue>), <fpage>1255</fpage>&#x2013;<lpage>1279</lpage>. <pub-id pub-id-type="doi">10.1007/s11069-020-04353-6</pub-id> </citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wen</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2021a</year>). <article-title>Assessment of landslide susceptibility mapping based on Bayesian hyperparameter optimization: A comparison between logistic regression and random forest</article-title>. <source>Eng. Geology.</source> <volume>281</volume>, <fpage>105972</fpage>. <pub-id pub-id-type="doi">10.1016/j.enggeo.2020.105972</pub-id> </citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tang</surname>
<given-names>R.-X.</given-names>
</name>
<name>
<surname>Yan</surname>
<given-names>E.-C.</given-names>
</name>
<name>
<surname>Wen</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Yin</surname>
<given-names>X.-M.</given-names>
</name>
<name>
<surname>Tang</surname>
<given-names>W.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Comparison of Logistic Regression, Information Value, and Comprehensive Evaluating Model for Landslide Susceptibility Mapping</article-title>. <source>Sustainability</source> <volume>13</volume>, <fpage>3803</fpage>. <pub-id pub-id-type="doi">10.3390/su13073803</pub-id> </citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tsangaratos</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Ilia</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Hong</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Applying information theory and GIS-based quantitative methods to produce landslide susceptibility maps in Nancheng County, China</article-title>. <source>Landslides</source> <volume>14</volume>, <fpage>1091</fpage>&#x2013;<lpage>1111</lpage>. <pub-id pub-id-type="doi">10.1007/s10346-016-0769-4</pub-id> </citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Van Tien</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Luong</surname>
<given-names>L. H.</given-names>
</name>
<name>
<surname>Duc</surname>
<given-names>D. M.</given-names>
</name>
<name>
<surname>Trinh</surname>
<given-names>P. T.</given-names>
</name>
<name>
<surname>Quynh</surname>
<given-names>D. T.</given-names>
</name>
<name>
<surname>Lan</surname>
<given-names>N. C.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Rainfall-induced catastrophic landslide in Quang Tri Province: the deadliest single landslide event in Vietnam in 2020</article-title>. <source>Landslides</source> <volume>18</volume>, <fpage>2323</fpage>&#x2013;<lpage>2327</lpage>. <pub-id pub-id-type="doi">10.1007/s10346-021-01664-y</pub-id> </citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Van Tien</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Trinh</surname>
<given-names>P. T.</given-names>
</name>
<name>
<surname>Luong</surname>
<given-names>L. H.</given-names>
</name>
<name>
<surname>Nhat</surname>
<given-names>L. M.</given-names>
</name>
<name>
<surname>Duc</surname>
<given-names>D. M.</given-names>
</name>
<name>
<surname>Hieu</surname>
<given-names>T. T.</given-names>
</name>
<etal/>
</person-group> (<year>2021a</year>). <article-title>The October 13, 2020, deadly rapid landslide triggered by heavy rainfall in Phong Dien, Thua Thien Hue, Vietnam</article-title>. <source>Landslides</source> <volume>18</volume>, <fpage>2329</fpage>&#x2013;<lpage>2333</lpage>. <pub-id pub-id-type="doi">10.1007/s10346-021-01663-z</pub-id> </citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Hao</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Meng</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Ding</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Assessment of landslide susceptibility and risk factors in China</article-title>. <source>Nat. Hazards</source> <volume>108</volume>, <fpage>3045</fpage>&#x2013;<lpage>3059</lpage>. <pub-id pub-id-type="doi">10.1007/s11069-021-04812-8</pub-id> </citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>J.&#x20;F.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>X. H.</given-names>
</name>
<name>
<surname>Christakos</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Liao</surname>
<given-names>Y. L.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Gu</surname>
<given-names>X.</given-names>
</name>
<etal/>
</person-group> (<year>2010</year>). <article-title>Geographical Detectors&#x2010;Based Health Risk Assessment and its Application in the Neural Tube Defects Study of the Heshun Region, China</article-title>. <source>Int. J.&#x20;Geographical Inf. Sci.</source> <volume>24</volume> (<issue>1</issue>), <fpage>107</fpage>&#x2013;<lpage>127</lpage>. <pub-id pub-id-type="doi">10.1080/13658810802443457</pub-id> </citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wubalem</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Landslide susceptibility mapping using statistical methods in Uatzau catchment area, northwestern Ethiopia</article-title>. <source>Geoenvironmental Disasters</source> <volume>8</volume>. <pub-id pub-id-type="doi">10.1186/s40677-020-00170-y</pub-id> </citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xie</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Wen</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Ma</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Baise</surname>
<given-names>L. G.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Application and comparison of Logistic regression model and Neural network model in earthquake-induced landslides susceptibility mapping at mountainous region, China</article-title>. <source>Geomatics, Nat. Hazards Risk</source> <volume>9</volume> (<issue>1</issue>), <fpage>501</fpage>&#x2013;<lpage>523</lpage>. <pub-id pub-id-type="doi">10.1080/19475705.2018.1451399</pub-id> </citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xie</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Jian</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Robledo</surname>
<given-names>L. F.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>A Novel Hybrid Method for Landslide Susceptibility Mapping-Based GeoDetector and Machine Learning Cluster: A Case of Xiaojin County, China</article-title>. <source>ISPRS Int. J. Geo-Inf.</source> <volume>10</volume>, <fpage>93</fpage>. <pub-id pub-id-type="doi">10.3390/ijgi10020093</pub-id> </citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Rainfall-induced landslides and debris flows in Mengdong Town, Yunnan Province, China</article-title>. <source>Landslides</source> <volume>17</volume>, <fpage>931</fpage>&#x2013;<lpage>941</lpage>. <pub-id pub-id-type="doi">10.1007/s10346-019-01336-y</pub-id> </citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yilmaz</surname>
<given-names>I.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>A case study from Koyulhisar (Sivas-Turkey) for landslide susceptibility mapping by artificial neural networks</article-title>. <source>Bull. Eng. Geol. Environ.</source> <volume>68</volume> (<issue>3</issue>), <fpage>297</fpage>&#x2013;<lpage>306</lpage>. <pub-id pub-id-type="doi">10.1007/s10064-009-0185-2</pub-id> </citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhao</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Z. Y.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Slope Unit-Based Landslide Susceptibility Mapping Using Certainty Factor, Support Vector Machine, Random Forest, CF-SVM and CF-RF Models</article-title>. <source>Front. Earth Sci.</source> <volume>9</volume>, <fpage>589630</fpage>. <pub-id pub-id-type="doi">10.3389/feart.2021.589630</pub-id> </citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Wen</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>W.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Landslide susceptibility mapping using hybrid random forest with GeoDetector and RFE for factor optimization</article-title>. <source>Geosci. Front.</source> <volume>12</volume> (<issue>5</issue>), <fpage>101211</fpage>. <pub-id pub-id-type="doi">10.1016/j.gsf.2021.101211</pub-id> </citation>
</ref>
</ref-list>
</back>
</article>