<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Environ. Sci.</journal-id>
<journal-title>Frontiers in Environmental Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Environ. Sci.</abbrev-journal-title>
<issn pub-type="epub">2296-665X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1131954</article-id>
<article-id pub-id-type="doi">10.3389/fenvs.2023.1131954</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Environmental Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Urban waterlogging prediction and risk analysis based on rainfall time series features: A case study of Shenzhen</article-title>
<alt-title alt-title-type="left-running-head">Zhang et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/fenvs.2023.1131954">10.3389/fenvs.2023.1131954</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Zhang</surname>
<given-names>Zongjia</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2125616/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Jian</surname>
<given-names>Xinyao</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2159544/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Chen</surname>
<given-names>Yiye</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Huang</surname>
<given-names>Zhejun</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Liu</surname>
<given-names>Junguo</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/947771/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Yang</surname>
<given-names>Lili</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>School of Environment</institution>, <institution>Harbin Institute of Technology</institution>, <addr-line>Harbin</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Department of Statistics and Data Science</institution>, <institution>Southern University of Science and Technology</institution>, <addr-line>Shenzhen</addr-line>, <country>China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>School of Environmental Science and Engineering</institution>, <institution>Southern University of Science and Technology</institution>, <addr-line>Shenzhen</addr-line>, <country>China</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Henan Provincial Key Laboratory of Hydrosphere and Watershed Water Security</institution>, <institution>North China University of Water Resources and Electric Power</institution>, <addr-line>Zhengzhou</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1425601/overview">Huiyu Dong</ext-link>, Chinese Academy of Sciences (CAS), China</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2218766/overview">Konstantinos Nikolopoulos</ext-link>, Durham University, United Kingdom</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1987392/overview">Jiabo Yin</ext-link>, Wuhan University, China</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Lili Yang, <email>yangll@sustech.edu.cn</email>
</corresp>
</author-notes>
<pub-date pub-type="epub">
<day>13</day>
<month>04</month>
<year>2023</year>
</pub-date>
<pub-date pub-type="collection">
<year>2023</year>
</pub-date>
<volume>11</volume>
<elocation-id>1131954</elocation-id>
<history>
<date date-type="received">
<day>26</day>
<month>12</month>
<year>2022</year>
</date>
<date date-type="accepted">
<day>03</day>
<month>04</month>
<year>2023</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2023 Zhang, Jian, Chen, Huang, Liu and Yang.</copyright-statement>
<copyright-year>2023</copyright-year>
<copyright-holder>Zhang, Jian, Chen, Huang, Liu and Yang</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>In recent years, the frequency of extreme weather has increased, and urban waterlogging caused by sudden rainfall has occurred from time to time. With the development of urbanization, a large amount of land has been developed and the proportion of impervious area has increased, intensifying the risk of urban waterlogging. How to use the available meteorological data for accurate prediction and early warning of waterlogging hazards has become a key issue in the field of disaster prevention and risk assessment. In this paper, based on historical meteorological data, we combine domain knowledge and model parameters to experimentally extract rainfall time series related features for future waterlogging depth prediction. A novel waterlogging depth prediction model that applies only rainfall data as input is proposed by machine learning algorithms. By analyzing a large amount of historical flooding monitoring data, a &#x201c;rainfall-waterlogging amplification factor&#x201d; based on the geographical features of monitoring stations is constructed to quantify the mapping relationship between rainfall and waterlogging depths at different locations. After the model is trained and corrected by the measured data, the prediction error for short-time rainfall basically reaches within 2&#xa0;cm. This method improves prediction performance by a factor of 2.5&#x2013;3 over featureless time series methods. It effectively overcomes the limitations of small coverage of monitoring stations and insufficient historical waterlogging data, and can achieve more accurate short-term waterlogging prediction. At the same time, it can provide reference suggestions for the government to conduct waterlogging risk analysis and add new sensor stations by counting the amplification factor of other locations.</p>
</abstract>
<kwd-group>
<kwd>urban waterlogging</kwd>
<kwd>time series</kwd>
<kwd>risk assessment</kwd>
<kwd>machine learning</kwd>
<kwd>rainfall</kwd>
<kwd>Shenzhen</kwd>
</kwd-group>
<contract-sponsor id="cn001">National Key Research and Development Program of China<named-content content-type="fundref-id">10.13039/501100012166</named-content>
</contract-sponsor>
<contract-sponsor id="cn002">National Natural Science Foundation of China<named-content content-type="fundref-id">10.13039/501100001809</named-content>
</contract-sponsor>
<contract-sponsor id="cn003">Shenzhen Science and Technology Innovation Program<named-content content-type="fundref-id">10.13039/501100017610</named-content>
</contract-sponsor>
</article-meta>
</front>
<body>
<sec id="s1">
<title>1 Introduction</title>
<p>Influenced by global climate change, the frequency and scale of extreme weather events have been on the rise in recent years, and urban flooding disasters caused by extreme weather events such as typhoons and short-lived heavy rainstorms have been increasing (<xref ref-type="bibr" rid="B8">Ferreira et al., 2015</xref>; <xref ref-type="bibr" rid="B39">Zhang et al., 2017</xref>). The intensity of extreme precipitation in most regions of the world shows a trend towards intensification and a concentration of rainfall events (<xref ref-type="bibr" rid="B36">Yin et al., 2022</xref>). Yin et al. used simulations from a large climate&#x2013;hydrology model ensemble of 111 members; their results provide crucial insights towards assessing and mitigating adverse effects of compound hazards on ecosystems and human wellbeing (<xref ref-type="bibr" rid="B35">Yin et al., 2023</xref>). Urbanization increases hardened area, reduces infiltration, increases runoff and triggers higher and faster peak water flow (<xref ref-type="bibr" rid="B20">Nayeb Yazdi et al., 2019</xref>; <xref ref-type="bibr" rid="B24">Sofia et al., 2019</xref>). It has reduced groundwater recharge from natural infiltration and has contributed to the high runoff (<xref ref-type="bibr" rid="B19">Nath et al., 2021</xref>). A large number of low-lying areas prone to flooding are incorporated into urban development plans, and the lack of drainage capacity further exacerbates the risk of flooding (<xref ref-type="bibr" rid="B6">Du et al., 2012</xref>). Increasing impervious cover in urban areas drives dramatic changes in rainfall infiltration and storage capacity, which makes urban floods sudden and frequent (<xref ref-type="bibr" rid="B18">Mu et al., 2020</xref>).</p>
<p>Waterlogging events on a global scale may have a serious and direct impact on the economy and humanitarianism, as well as continue to adversely affect economic development (<xref ref-type="bibr" rid="B1">Arshad et al., 2019</xref>). Globally, the occurrence of urban floods has been unprecedented resulting in huge economic and social losses (<xref ref-type="bibr" rid="B25">Sundaram et al., 2021</xref>). In July 2021, the rainstorm in Zhengzhou, China caused 380 deaths and a direct economic loss of 120.06 billion yuan. Urban flood disaster has become a crucial problem restricting the healthy development of China&#x2019;s economy and society (<xref ref-type="bibr" rid="B7">Duan et al., 2022</xref>; <xref ref-type="bibr" rid="B13">Li et al., 2022</xref>). Urban floods can cause huge economic losses and casualties, and countries all over the world attach great importance to urban flood warning and mitigation. Therefore, obtaining timely and highly accurate waterlogging depth information with wide coverage is urgently needed for emergency response and risk mitigation, especially using an affordable, accurate, and widespread approach (<xref ref-type="bibr" rid="B4">Deo and Wen, 2016</xref>). Nowadays, more and more researchers have started to pay attention to urban waterlogging (<xref ref-type="bibr" rid="B37">Yin et al., 2015</xref>). Among them, accurate prediction of inland flooding is a hot research problem in the field. For accurate prediction and warning of the extent and depth of internal flooding, there are mainly numerical simulation methods, hydrological methods, and data-driven methods.</p>
<p>Numerical simulation method. Based on the principles of hydrodynamics, the model uses the underlying surface and elevation factors comprehensively in waterlogging process; it performs the whole process of city waterlogging formation in detail. Its simulation results are waterlogging distribution and waterlogging depth maps of a certain time step (<xref ref-type="bibr" rid="B31">Xue et al., 2016</xref>). Numerical simulation methods allow easy estimation of waterlogging under each recurrence period rainfall. It is interesting to note that under different urbanization and rainfall scenarios, the urban waterlogging susceptibility has a considerable variation (Explicit the urban waterlogging spatial variation and its driving factors: The stepwise cluster analysis model and hierarchical partitioning analysis approach). The hydrological and hydrodynamic model couples the distributed hydrological model and two-dimensional hydrodynamic model, which not only ensures the accuracy of the model but also has good calculation efficiency. It is a promising research direction for the flood model (<xref ref-type="bibr" rid="B15">Liu et al., 2022a</xref>). On the other hand, it also shortens waterlogging simulation time, and finally improves the applicability of waterlogging simulation (<xref ref-type="bibr" rid="B42">Zounemat-Kermani et al., 2020</xref>). But the disadvantage is that small number of data mining model parameters, such as the obscure physical implications of model parameters and the insufficient amount of simulation training, the simulation is prone to the problem of different arguments (<xref ref-type="bibr" rid="B26">Tang et al., 2021</xref>). Furthermore, the computational efficiency of numerical models is too low to meet the requirements of urban emergency management. Thus, many coupled methods of numerical simulation and other methods such as machine learning have emerged. 
A new method was established by combining a long short-term memory (LSTM) neural network model with a numerical model, which can quickly predict the waterlogging depth. The principle is to train the LSTM neural network to predict and simulate the internal flooding process by using the numerical simulation results as training samples (<xref ref-type="bibr" rid="B15">Liu et al., 2022a</xref>). However, the disadvantage of this method is that the accuracy of the LSTM results is extremely dependent on the results of the preceding numerical simulation. If the error of the numerical simulation results is large, the accuracy of the predictions is difficult to guarantee.</p>
<p>In recent years, with the application of water level sensors, many cities have established urban waterlogging monitoring and early warning systems. But water level sensors are expensive and cannot be deployed all over the city (<xref ref-type="bibr" rid="B17">Loftis et al., 2018</xref>). Moreover, the simple monitoring data can only reflect the real-time depth of water accumulation and do not provide a robust forecasting function (<xref ref-type="bibr" rid="B16">Liu et al., 2022b</xref>). As more and more water level sensors acquire large amounts of historical waterlogging data, some studies are beginning to train models based on historical real waterlogging data, or to use coupled models to improve the performance of prediction methods. The most representative of these is the data-driven method based on time series. Ding et al. proposed an explicable spatiotemporal attention long short-term memory model (STA-LSTM) based on LSTM and an attention mechanism, and established the model using a dynamic attention mechanism and the LSTM method to make an explicable analysis of flood prediction (<xref ref-type="bibr" rid="B5">Ding et al., 2020</xref>). Yan et al. proposed a prediction model of the maximum water depth in time and space employing a neural network-numerical simulation model on the basis of coupling a two-dimensional hydrological and hydrodynamic model and a statistical analysis model. But due to data limitations, the actual rainfall and waterlogging data were not added to the database for training. Therefore, although the performance of the prediction model is satisfactory, its accuracy can be improved further after collecting enough data (<xref ref-type="bibr" rid="B33">Yan et al., 2021</xref>). Wu et al. established a real-time prediction model of flood depth at waterlogging points by using the GBDT algorithm based on multi-factor analysis and verified the validity and applicability of the model for real-time prediction of the waterlogging process. 
However, the model used by Wu et al. can only make predictions while rainfall is occurring, and cannot predict the flood depth after rainfall (<xref ref-type="bibr" rid="B30">Wu et al., 2020a</xref>).</p>
<p>However, some recent studies have shown that the prediction performance of a single method or model is always limited. For example, Bayesian model averaging (BMA) has been used to account for model structure, parameter and input forcing uncertainty in flood inundation modeling. The combination of multiple models can effectively improve the prediction performance. Multi-model combination methods can deal with model uncertainty and improve model performance (<xref ref-type="bibr" rid="B32">Yan and Hamid, 2016</xref>). Zhou et al. proposed an extreme flood information estimation method considering the uncertainty of distribution and model structure using the BMA method. They constructed a comprehensive prediction model with BMA and three machine learning methods (support vector machines (SVM), Back Propagation Neural Network (BPNN) and Adaptive Boosting (AdaBoost)) and used rainfall forecast data to drive the BMA model for fine early warning of urban floods. The analysis of early warning in two different urban flood events indicates that BMA is more suitable for the prediction of severe waterlogging and illustrates the great potential and prospects of BMA in urban flood early warning (<xref ref-type="bibr" rid="B41">Zhou et al., 2022</xref>). Naive Bayes (NB) and Random Forest (RF) algorithms were used to forecast the waterlogging point and the waterlogging process at the waterlogging point respectively to achieve the goal of predicting the whole process of urban waterlogging (<xref ref-type="bibr" rid="B28">Wang et al., 2021</xref>). In another study, historical flooding events and the values of flood contributing factors were used as inputs for the model. These input data were converted to raster layers with the help of GIS tools. The dependent variable was a one-hot encoded vector stating whether or not flooding occurred under those conditions (<xref ref-type="bibr" rid="B12">Khatri et al., 2022</xref>). 
The random forest (RF), logistic model tree (LMT) and other bivariate models combined with data mining tools can be used to simulate flood susceptibility. The study found that the LMT has good predictive power, so the model can be used for future flood mitigation in specific areas (<xref ref-type="bibr" rid="B23">Shahabi et al., 2020</xref>). A data warehouse and a deep learning algorithm were used to assess urban flood risk. The GBDT model shows 88.48% accuracy in predicting the depth of water accumulation (<xref ref-type="bibr" rid="B29">Wu et al., 2020b</xref>). An application of data-driven models using artificial neural network, support vector regression and long short-term memory approaches with distributed forcing data was presented for runoff predictions. The results showed that the long short-term memory and support vector regression models outperform the artificial neural network model for hourly runoff forecasting, and the predictive performance of the models was greater during the wet seasons compared to the dry seasons (<xref ref-type="bibr" rid="B10">Han and Morrison, 2021</xref>). Puttinaovarat and Horkaew proposed a novel flood forecasting system based on fusing meteorological, hydrological, geospatial, and crowdsource big data in an adaptive machine learning framework (<xref ref-type="bibr" rid="B21">Puttinaovarat and Horkaew, 2020</xref>).</p>
<p>Existing studies have not sufficiently analyzed rainfall time series. Combined with waterlogging sensor data, more accurate predictions of waterlogging depths can be obtained with an accuracy of centimeters or even millimeters. The input condition used in this paper is rainfall data, which is free from the limitation of waterlogging sensors. The transfer of the model prediction capability can be achieved at locations where the features are similar to the sensor points.</p>
</sec>
<sec sec-type="methods" id="s2">
<title>2 Methodology</title>
<sec id="s2-1">
<title>2.1 Framework</title>
<p>This study follows the framework shown in <xref ref-type="fig" rid="F1">Figure 1</xref>: features for training are selected from the original rainfall time series using domain knowledge, VIF verification and parameter correction. After sliding window slicing and processing the data, the input-output matrix is constructed and the waterlogging prediction is performed by using machine learning regressors. Geographic features around the station are extracted from the geographic information, their influence on the amplification factor is analyzed, and the result is used for regional waterlogging risk analysis.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>The framework of the method.</p>
</caption>
<graphic xlink:href="fenvs-11-1131954-g001.tif"/>
</fig>
</sec>
<sec id="s2-2">
<title>2.2 Data processing</title>
<p>In this paper, the historical rainfall dataset and the waterlogging depth dataset are used to predict the future waterlogging depth. The amplification factor is established by characterization of geographic feature data. Data processing is divided into five main steps: 1) Data cleaning. Considering the possible sensor failure or low sensor sensitivity, the initial screening of valid stations is done according to the number of valid data in the cumulative flooding dataset. 2) Construction of uniform structured data. The different total working hours of different sensors lead to inconsistent start and end dates of the collected data; the start and end time nodes are therefore unified by truncating the series and artificially adding zero-valued nodes, so that the datasets of different stations keep the same length. 3) Resampling. Because different sensors have different working mechanisms, their sampling intervals are not consistent; the resampling function of Python is used to unify the sampling interval for subsequent model training. 4) Data interpolation. Data interpolation is used to fill in the missing values in the data after resampling to make the time series continuous and in line with reality. 5) Sliding window slicing and data integration. According to the structural requirements of the training model and the prediction strategy, the time series are segmented by sliding windows, reconstructed with the extracted time series features, and the data are integrated into the model.</p>
</sec>
<sec id="s2-3">
<title>2.3 Model feature construction</title>
<sec id="s2-3-1">
<title>2.3.1 Time series feature extraction and construction</title>
<p>In order to extract more valuable information for the model from the time series, this paper uses statistical methods and domain knowledge to extract and construct new feature vectors to improve the model prediction performance.</p>
<sec id="s2-3-1-1">
<title>2.3.1.1 Unit rainfall</title>
<p>The rainfall data in this paper are sliding rainfall, which reflects the total amount of rainfall in the previous period but lacks a direct description of the rainfall in the current period, so the rainfall intensity information is lost. The current rainfall intensity will largely affect the subsequent waterlogging. Therefore, an iterative algorithm is used here to calculate the unit rainfall (UR) from the sliding rainfall, as shown in Eq. <xref ref-type="disp-formula" rid="e1">1</xref>.<disp-formula id="e1">
<mml:math id="m1">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">R</mml:mi>
<mml:mi mathvariant="bold-italic">t</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="bold-italic">R</mml:mi>
<mml:mn mathvariant="bold">01</mml:mn>
<mml:mi mathvariant="bold-italic">H</mml:mi>
</mml:mrow>
<mml:mi mathvariant="bold-italic">t</mml:mi>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="bold-italic">R</mml:mi>
<mml:mn mathvariant="bold">01</mml:mn>
<mml:mi mathvariant="bold-italic">H</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="bold-italic">t</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mi mathvariant="bold-italic">&#x3c4;</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="bold-italic">R</mml:mi>
<mml:mn mathvariant="bold">01</mml:mn>
<mml:mi mathvariant="bold-italic">H</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="bold-italic">t</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn mathvariant="bold">2</mml:mn>
<mml:mi mathvariant="bold-italic">&#x3c4;</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="bold-italic">R</mml:mi>
<mml:mn mathvariant="bold">01</mml:mn>
<mml:mi mathvariant="bold-italic">H</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="bold-italic">t</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn mathvariant="bold">3</mml:mn>
<mml:mi mathvariant="bold-italic">&#x3c4;</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="bold-italic">R</mml:mi>
<mml:mn mathvariant="bold">01</mml:mn>
<mml:mi mathvariant="bold-italic">H</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="bold-italic">t</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mi mathvariant="bold-italic">p</mml:mi>
<mml:mi mathvariant="bold-italic">&#x3c4;</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:mspace width="1em"/>
<mml:mi mathvariant="bold-italic">U</mml:mi>
<mml:mi mathvariant="bold-italic">R</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">R</mml:mi>
<mml:msub>
<mml:mi mathvariant="bold-italic">t</mml:mi>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:msub>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">R</mml:mi>
<mml:msub>
<mml:mi mathvariant="bold-italic">t</mml:mi>
<mml:mn mathvariant="bold">2</mml:mn>
</mml:msub>
</mml:msub>
</mml:mrow>
</mml:math>
<label>(1)</label>
</disp-formula>where <inline-formula id="inf1">
<mml:math id="m2">
<mml:mrow>
<mml:mi mathvariant="normal">&#x3c4;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is 1&#xa0;h, t is the current time, UR is the accumulated rainfall during time period [<inline-formula id="inf2">
<mml:math id="m3">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>].</p>
</sec>
<sec id="s2-3-1-2">
<title>2.3.1.2 Seasonality coefficient</title>
<p>In addition to the amount of rainfall, the ability of the ground surface to form waterlogging is mainly influenced by the runoff coefficient. The runoff coefficient is mainly related to the type of land cover, slope, soil aridity and infiltration capacity. The process of runoff generation is also influenced by multiple factors such as latitude, climate zone, monsoon, and season (<xref ref-type="bibr" rid="B27">Tarasova et al., 2018</xref>). Differences in air humidity, air pressure, and temperature brought about by seasonal changes will directly affect the water content in the air and soil. During the dry season, the water content in the soil is low, rainfall is easily absorbed by the soil, and the intensity of rainfall is relatively low during the dry season, resulting in less occurrence of waterlogging (<xref ref-type="bibr" rid="B2">Burak et al., 2020</xref>). During the rainy season, the water content in the soil is high and even nearly saturated in some areas (e.g., seasonal wetlands). Rainfall is not easily absorbed by the soil, and the rainfall intensity is relatively high and transient during the rainy season, leading to relatively easy waterlogging (<xref ref-type="bibr" rid="B38">Zavala et al., 2008</xref>). Therefore, the seasonality coefficient S is defined and the dry months (MD), rainy months (MR) and transition months (MT) are determined based on the multi-year monthly average rainfall statistics (<xref ref-type="table" rid="T1">Table 1</xref>).</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Seasonality coefficient S of the month to which the event belongs.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Indicators</th>
<th align="left">MR</th>
<th align="left">MT</th>
<th align="left">MD</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">R_Mean</td>
<td align="left">R<sub>1</sub>
</td>
<td align="left">R<sub>2</sub>
</td>
<td align="left">R<sub>3</sub>
</td>
</tr>
<tr>
<td align="left">S</td>
<td align="left">lg10</td>
<td align="left">lg6</td>
<td align="left">lg2</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s2-3-1-3">
<title>2.3.1.3 Correlation features related to rainfall interval</title>
<p>The period between rainfall events affects the infiltration capacity and runoff coefficient. When two rainfall events are separated by a long interval, the water content in the soil or surface is already at a low level due to sufficient infiltration and evaporation. In contrast, when the water content between two rainfall events is high, surface runoff is more likely to form and thus converge to produce waterlogging when the rainfall occurs again (<xref ref-type="bibr" rid="B22">Ran et al., 2012</xref>). In this paper, we define the rainfall interval <inline-formula id="inf3">
<mml:math id="m4">
<mml:mrow>
<mml:mi>&#x3b4;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>, which is the interval between the beginning of this rainfall period and the end of the previous rainfall period (h). We define the wetting coefficient <inline-formula id="inf4">
<mml:math id="m5">
<mml:mrow>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mi>w</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> as Eq. <xref ref-type="disp-formula" rid="e2">2</xref> (<xref ref-type="bibr" rid="B40">Zhang et al., 2023</xref>), which is the ratio between the mean value of rainfall of this rainfall event and the rainfall interval &#x3b4;, representing the wetting capacity of this rainfall on the land. Horton infiltration curves are commonly used in the field of hydrology to model the rate variation of fluid infiltration in different surfaces. The Horton infiltration equation (<xref ref-type="bibr" rid="B34">Yang et al., 2020</xref>) is <inline-formula id="inf5">
<mml:math id="m6">
<mml:mrow>
<mml:mi>f</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mi>c</mml:mi>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mn>0</mml:mn>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mi>c</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:msup>
<mml:mi>e</mml:mi>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>k</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula>, where <inline-formula id="inf6">
<mml:math id="m7">
<mml:mrow>
<mml:mi>f</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is the infiltration rate, <inline-formula id="inf7">
<mml:math id="m8">
<mml:mrow>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mi>c</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the stable infiltration rate, <inline-formula id="inf8">
<mml:math id="m9">
<mml:mrow>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mn>0</mml:mn>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the initial infiltration rate, <inline-formula id="inf9">
<mml:math id="m10">
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is the time, and <inline-formula id="inf10">
<mml:math id="m11">
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is an empirical constant related to soil properties. Considering that the surface differences of monitoring stations are not significant, the function <inline-formula id="inf11">
<mml:math id="m12">
<mml:mrow>
<mml:msup>
<mml:mi>e</mml:mi>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:math>
</inline-formula> is introduced as the basis function, and the integrated infiltration capacity <inline-formula id="inf12">
<mml:math id="m13">
<mml:mrow>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is fitted from the rainfall time series curve as Eq. <xref ref-type="disp-formula" rid="e3">3</xref>.<disp-formula id="e2">
<mml:math id="m14">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">C</mml:mi>
<mml:mi mathvariant="bold-italic">w</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">R</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">m</mml:mi>
<mml:mi mathvariant="bold-italic">e</mml:mi>
<mml:mi mathvariant="bold-italic">a</mml:mi>
<mml:mi mathvariant="bold-italic">n</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="bold-italic">&#x3b4;</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
<label>(2)</label>
</disp-formula>
<disp-formula id="e3">
<mml:math id="m15">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">C</mml:mi>
<mml:mi mathvariant="bold-italic">i</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:msup>
<mml:mi mathvariant="bold-italic">e</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mi mathvariant="bold">lg</mml:mi>
<mml:mo>&#x2061;</mml:mo>
<mml:mi mathvariant="bold-italic">&#x3b4;</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:msup>
<mml:msub>
<mml:mi mathvariant="bold-italic">R</mml:mi>
<mml:mi mathvariant="bold-italic">max</mml:mi>
</mml:msub>
<mml:mfrac>
<mml:mrow>
<mml:mi mathvariant="bold">ln</mml:mi>
<mml:mo>&#x2061;</mml:mo>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mfenced open="|" close="|" separators="|">
<mml:mrow>
<mml:mi mathvariant="bold-italic">&#x3b1;</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
<mml:mi mathvariant="bold-italic">L</mml:mi>
</mml:mfrac>
</mml:mrow>
</mml:math>
<label>(3)</label>
</disp-formula>where <inline-formula id="inf13">
<mml:math id="m16">
<mml:mrow>
<mml:msub>
<mml:mi>R</mml:mi>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the mean rainfall (mm), <inline-formula id="inf14">
<mml:math id="m17">
<mml:mrow>
<mml:mi>&#x3b4;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is the rainfall interval (h); <inline-formula id="inf15">
<mml:math id="m18">
<mml:mrow>
<mml:msub>
<mml:mi>R</mml:mi>
<mml:mi mathvariant="italic">max</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the maximum value of rainfall in this segment (mm); <inline-formula id="inf16">
<mml:math id="m19">
<mml:mrow>
<mml:mi>&#x3b1;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is the slope of each point of the rainfall event sequence curve; and <inline-formula id="inf17">
<mml:math id="m20">
<mml:mrow>
<mml:mi>L</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is the length of rainfall events.</p>
</sec>
<sec id="s2-3-1-4">
<title>2.3.1.4 Statistical features</title>
<p>The rainfall time series itself contains many features in its statistics. The mean value <inline-formula id="inf18">
<mml:math id="m21">
<mml:mrow>
<mml:msub>
<mml:mi>R</mml:mi>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and the maximum value <inline-formula id="inf19">
<mml:math id="m22">
<mml:mrow>
<mml:msub>
<mml:mi>R</mml:mi>
<mml:mi mathvariant="italic">max</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> reflect the scale of rainfall and are important indicators of the amount of rainfall. The standard deviation <inline-formula id="inf20">
<mml:math id="m23">
<mml:mrow>
<mml:msub>
<mml:mi>R</mml:mi>
<mml:mrow>
<mml:mi>s</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>d</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> reflects whether the rainfall is evenly distributed in time and is useful for identifying sudden and severe rainfall: even when the total rainfall is not large, a high instantaneous intensity can easily trigger waterlogging (<xref ref-type="bibr" rid="B3">David et al., 2013</xref>). The kurtosis indicates whether the rainfall curve is gentle or steep. Skewness indicates whether the peak intensity of rainfall falls in the first half or the second half of the rainfall curve. AUC is the area under the rainfall curve and represents the total amount of rainfall.</p>
</sec>
</sec>
<sec id="s2-3-2">
<title>2.3.2 Feature filtering</title>
<p>The statistical features extracted from the rainfall time series and the features constructed based on domain knowledge together form the feature set. However, sometimes some features may not correlate well with the model mechanism and do not have good predictive ability and may even negatively affect the model. By filtering the features through domain knowledge, model experiments and VIF validation, we can remove the insignificant features and thus improve the accuracy of the model. It can also reduce the computational cost and improve the interpretability of the model (<xref ref-type="bibr" rid="B11">Khalid et al., 2014</xref>).</p>
</sec>
</sec>
<sec id="s2-4">
<title>2.4 Constructing model input and output matrices</title>
<p>A uniform rainfall slice length <inline-formula id="inf21">
<mml:math id="m24">
<mml:mrow>
<mml:mi>l</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is selected, and the number of slice bars within each rainfall event of irregular length (serial number <inline-formula id="inf22">
<mml:math id="m25">
<mml:mrow>
<mml:mi>k</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>, total length <inline-formula id="inf23">
<mml:math id="m26">
<mml:mrow>
<mml:msub>
<mml:mi>L</mml:mi>
<mml:mi>k</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>) can be denoted as <inline-formula id="inf24">
<mml:math id="m27">
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>, where <inline-formula id="inf25">
<mml:math id="m28">
<mml:mrow>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> is calculated by Eq. <xref ref-type="disp-formula" rid="e4">4</xref>. The rainfall events are iteratively sliced according to a fixed sliding window length (<xref ref-type="fig" rid="F2">Figure 2</xref>).<disp-formula id="e4">
<mml:math id="m29">
<mml:mrow>
<mml:mi mathvariant="bold-italic">n</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">L</mml:mi>
<mml:mi mathvariant="bold-italic">k</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mi mathvariant="bold-italic">l</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:mrow>
</mml:math>
<label>(4)</label>
</disp-formula>
</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Schematic diagram of data slicing and integration.</p>
</caption>
<graphic xlink:href="fenvs-11-1131954-g002.tif"/>
</fig>
<p>The rainfall input vector <inline-formula id="inf26">
<mml:math id="m30">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> within each event can be expressed as Eq. <xref ref-type="disp-formula" rid="e5">5</xref>.
<disp-formula id="e5">
<mml:math id="m31">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">r</mml:mi>
<mml:mi mathvariant="bold-italic">i</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mrow>
<mml:mfenced open="[" close="]" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">r</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mtext>&#x2009;</mml:mtext>
<mml:msub>
<mml:mi mathvariant="bold-italic">r</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mn mathvariant="bold">2</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mtext>&#x2009;</mml:mtext>
<mml:msub>
<mml:mi mathvariant="bold-italic">r</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mn mathvariant="bold">3</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mtext>&#x2009;</mml:mtext>
<mml:msub>
<mml:mi mathvariant="bold-italic">r</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mn mathvariant="bold">4</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mo>&#x22ef;</mml:mo>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">r</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi mathvariant="bold-italic">l</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:msub>
<mml:mtext>&#x2009;</mml:mtext>
<mml:msub>
<mml:mi mathvariant="bold-italic">r</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mi mathvariant="bold-italic">l</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
<label>(5)</label>
</disp-formula>
</p>
<p>The rainfall time series feature vector <inline-formula id="inf27">
<mml:math id="m32">
<mml:mrow>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> within each event can be expressed as Eq. <xref ref-type="disp-formula" rid="e6">6</xref>, with each slice having a feature vector length of <inline-formula id="inf28">
<mml:math id="m33">
<mml:mrow>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula>. Unlike <inline-formula id="inf29">
<mml:math id="m34">
<mml:mrow>
<mml:msub>
<mml:mi>r</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, to characterize the cumulative effect of rainfall, each <inline-formula id="inf30">
<mml:math id="m35">
<mml:mrow>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is calculated from the data between the beginning of the rainfall event in that segment and the end of the slice in this segment.<disp-formula id="e6">
<mml:math id="m36">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">f</mml:mi>
<mml:mi mathvariant="bold-italic">i</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mrow>
<mml:mfenced open="[" close="]" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">f</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mtext>&#x2009;</mml:mtext>
<mml:msub>
<mml:mi mathvariant="bold-italic">f</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mn mathvariant="bold">2</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mtext>&#x2009;</mml:mtext>
<mml:msub>
<mml:mi mathvariant="bold-italic">f</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mn mathvariant="bold">3</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mtext>&#x2002;</mml:mtext>
<mml:msub>
<mml:mi mathvariant="bold-italic">f</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mn mathvariant="bold">4</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mo>&#x22ef;</mml:mo>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">f</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi mathvariant="bold-italic">m</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:msub>
<mml:mtext>&#x2002;</mml:mtext>
<mml:msub>
<mml:mi mathvariant="bold-italic">f</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mi mathvariant="bold-italic">m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
<label>(6)</label>
</disp-formula>
</p>
<p>The single input vector of the model can be expressed as Eq. <xref ref-type="disp-formula" rid="e7">7</xref>.<disp-formula id="e7">
<mml:math id="m37">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">x</mml:mi>
<mml:mi mathvariant="bold-italic">i</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mrow>
<mml:mfenced open="[" close="]" separators="|">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">r</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mtext>&#x2009;</mml:mtext>
<mml:msub>
<mml:mi mathvariant="bold-italic">r</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mn mathvariant="bold">2</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mtext>&#x2009;</mml:mtext>
<mml:msub>
<mml:mi mathvariant="bold-italic">r</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mn mathvariant="bold">3</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mtext>&#x2009;</mml:mtext>
<mml:msub>
<mml:mi mathvariant="bold-italic">r</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mn mathvariant="bold">4</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mo>&#x22ef;</mml:mo>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">r</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mi mathvariant="bold-italic">l</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">f</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mtext>&#x2009;</mml:mtext>
<mml:msub>
<mml:mi mathvariant="bold-italic">f</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mn mathvariant="bold">2</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mtext>&#x2009;</mml:mtext>
<mml:msub>
<mml:mi mathvariant="bold-italic">f</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mn mathvariant="bold">3</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mtext>&#x2002;</mml:mtext>
<mml:msub>
<mml:mi mathvariant="bold-italic">f</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mn mathvariant="bold">4</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:mo>&#x22ef;</mml:mo>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">f</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mi mathvariant="bold-italic">m</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
<label>(7)</label>
</disp-formula>
</p>
<p>The combined input matrix X can be expressed as Eq. <xref ref-type="disp-formula" rid="e8">8</xref>, and the output matrix as Eq. <xref ref-type="disp-formula" rid="e9">9</xref>. The input-output relationship in regression model can be expressed as Eq. <xref ref-type="disp-formula" rid="e10">10</xref>.<disp-formula id="e8">
<mml:math id="m38">
<mml:mrow>
<mml:mi mathvariant="bold-italic">X</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mrow>
<mml:mfenced open="[" close="]" separators="|">
<mml:mrow>
<mml:mtable columnalign="center">
<mml:mtr>
<mml:mtd>
<mml:mtable columnalign="center">
<mml:mtr>
<mml:mtd>
<mml:msub>
<mml:mi mathvariant="bold-italic">r</mml:mi>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:msub>
</mml:mtd>
<mml:mtd>
<mml:msub>
<mml:mi mathvariant="bold-italic">f</mml:mi>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:msub>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:msub>
<mml:mi mathvariant="bold-italic">r</mml:mi>
<mml:mn mathvariant="bold">2</mml:mn>
</mml:msub>
</mml:mtd>
<mml:mtd>
<mml:msub>
<mml:mi mathvariant="bold-italic">f</mml:mi>
<mml:mn mathvariant="bold">2</mml:mn>
</mml:msub>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mtable columnalign="center">
<mml:mtr>
<mml:mtd>
<mml:mo>&#x2026;</mml:mo>
</mml:mtd>
<mml:mtd>
<mml:mo>&#x2026;</mml:mo>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:msub>
<mml:mi mathvariant="bold-italic">r</mml:mi>
<mml:mi mathvariant="bold-italic">i</mml:mi>
</mml:msub>
</mml:mtd>
<mml:mtd>
<mml:msub>
<mml:mi mathvariant="bold-italic">f</mml:mi>
<mml:mi mathvariant="bold-italic">i</mml:mi>
</mml:msub>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
<label>(8)</label>
</disp-formula>
<disp-formula id="e9">
<mml:math id="m39">
<mml:mrow>
<mml:mi mathvariant="bold-italic">y</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mrow>
<mml:mfenced open="[" close="]" separators="|">
<mml:mrow>
<mml:mtable columnalign="center">
<mml:mtr>
<mml:mtd>
<mml:mtable columnalign="center">
<mml:mtr>
<mml:mtd>
<mml:msub>
<mml:mi mathvariant="bold-italic">y</mml:mi>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:msub>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:msub>
<mml:mi mathvariant="bold-italic">y</mml:mi>
<mml:mn mathvariant="bold">2</mml:mn>
</mml:msub>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mo>&#x22ee;</mml:mo>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:mtable columnalign="center">
<mml:mtr>
<mml:mtd>
<mml:mo>&#x22ee;</mml:mo>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:msub>
<mml:mi mathvariant="bold-italic">y</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd>
<mml:msub>
<mml:mi mathvariant="bold-italic">y</mml:mi>
<mml:mi mathvariant="bold-italic">i</mml:mi>
</mml:msub>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
<label>(9)</label>
</disp-formula>
<disp-formula id="e10">
<mml:math id="m40">
<mml:mrow>
<mml:mi mathvariant="bold-italic">y</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mi mathvariant="bold">&#x3c6;</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi mathvariant="bold-italic">X</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
</mml:mrow>
</mml:math>
<label>(10)</label>
</disp-formula>
</p>
</sec>
<sec id="s2-5">
<title>2.5 Model training and validation</title>
<p>After processing the data, the samples are divided by random sampling into training and test sets at a ratio of 70% to 30% and imported into the regression model. The optimal parameters, including slice length, number of features, feature combination method and prediction strategy, are determined by testing. The performance of several machine learning algorithms is compared to obtain the optimal model configuration.</p>
</sec>
<sec id="s2-6">
<title>2.6 Geographical feature statistics and risk analysis</title>
<p>Through multi-source analysis of meteorological, waterlogging, topographic and municipal data, the geographical features, including terrain, land cover type and drainage network distribution, within a 500&#xa0;m diameter area around the station are integrated. The amplification factor (AF) between rainfall and waterlogging depth is calculated from historical data, and the risk of waterlogging in the area is analyzed according to the AF; the larger the AF, the higher the possibility of generating deeper waterlogging.</p>
</sec>
</sec>
<sec id="s3">
<title>3 Case study</title>
<sec id="s3-1">
<title>3.1 Study area</title>
<p>Shenzhen is one of the core cities of the Guangdong-Hong Kong-Macao Greater Bay Area. Over the past 40&#xa0;years, Shenzhen&#x2019;s GDP has grown rapidly from 270 million yuan in 1980 to 2,767.02 billion yuan in 2021. The annual average rainfall is 1935.8&#xa0;mm, and the time distribution shows that the rainfall is mainly concentrated in April to September, with a spatial trend of decreasing rainfall from the southeast to the northwest. Typhoons and rainstorms are the most frequently occurring hazards in Shenzhen (<xref ref-type="bibr" rid="B9">Gong et al., 2022</xref>). Shenzhen is prone to frequent short-duration rainstorms, which often result in severe waterlogging in the city and, sometimes, can even cause casualties (<xref ref-type="bibr" rid="B14">Liu et al., 2020</xref>). Shenzhen City had an extreme rainstorm on 11 April 2019, resulting in an internal waterlogging event that killed 11 people in the city. Therefore, it is important to be able to predict waterlogging disasters and give advance warning of them, to protect the safety of citizens as well as to improve the disaster prevention and mitigation capacity of the city. <xref ref-type="fig" rid="F3">Figure 3</xref> shows the location of Shenzhen and the area involved in the study, and <xref ref-type="table" rid="T2">Table 2</xref> shows the data used for the case.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Study area of Shenzhen, China.</p>
</caption>
<graphic xlink:href="fenvs-11-1131954-g003.tif"/>
</fig>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Data description and sources.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Item</th>
<th align="left">Data description</th>
<th align="left">Data source</th>
<th align="left">Resolution</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Historical waterlogging sensor data</td>
<td align="left">Waterlogging sensor monitoring data. (January 2019 to December 2020)</td>
<td align="left">Water Bureau of Shenzhen Municipality (WBSM)</td>
<td align="left">0.01&#xa0;m</td>
</tr>
<tr>
<td align="left">Historical meteorological station data</td>
<td align="left">Meteorological basic observation data of rainfall, wind speed, visibility, temperature and humidity at all stations in the city. (January 2019 to December 2020)</td>
<td align="left">Shenzhen Meteorological Bureau (SMB)</td>
<td align="left">5&#xa0;min</td>
</tr>
<tr>
<td align="left">Digital elevation model (DEM)</td>
<td align="left">Realize digital simulation of ground terrain through limited terrain elevation data</td>
<td align="left">BIGEMAP</td>
<td align="left">5m&#x2a;5m</td>
</tr>
<tr>
<td align="left">Land cover type</td>
<td align="left">Current status of all land use in the city, including construction land, broad-leaved forest land, coniferous forest land, water bodies, wetlands, etc.</td>
<td align="left">Global Fine Land cover product (GLC_FCS30-2019). Academy of Aerospace Information Innovation, Chinese Academy of Sciences</td>
<td align="left">30&#x2a;30&#xa0;m</td>
</tr>
<tr>
<td align="left">Drainage system</td>
<td align="left">Rainwater outlet vector file, including location, orifice size, orifice shape</td>
<td align="left">Water Bureau of Shenzhen Municipality (WBSM)</td>
<td align="left">0.001&#xa0;m</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
</sec>
<sec sec-type="results" id="s4">
<title>4 Results</title>
<p>The paper conducted experiments on four monitoring stations. As shown in <xref ref-type="table" rid="T3">Table 3</xref>, in the comparison of the three algorithms, Random Forest (RF) has the smallest MSE except at station D, where RF has a slightly larger MSE than Gradient Boosting Decision Tree (GBDT), indicating that RF is better adapted to this prediction task.</p>
<table-wrap id="T3" position="float">
<label>TABLE 3</label>
<caption>
<p>Comparison of machine learning algorithms.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Station</th>
<th colspan="3" align="center">MSE of algorithm</th>
</tr>
<tr>
<th align="left"/>
<th align="left">Adaboost</th>
<th align="left">GBDT</th>
<th align="left">RF</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">A</td>
<td align="left">0.006976</td>
<td align="left">0.000409</td>
<td align="left">
<bold>0.000089</bold>
</td>
</tr>
<tr>
<td align="left">B</td>
<td align="left">0.000071</td>
<td align="left">0.000042</td>
<td align="left">
<bold>0.000022</bold>
</td>
</tr>
<tr>
<td align="left">C</td>
<td align="left">0.000440</td>
<td align="left">0.000302</td>
<td align="left">
<bold>0.000254</bold>
</td>
</tr>
<tr>
<td align="left">D</td>
<td align="left">0.003706</td>
<td align="left">
<bold>0.000190</bold>
</td>
<td align="left">0.000238</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>The bold represents the result of the optimal algorithm for each station.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>Compared to direct prediction using the original time series, the method of adding extracted features achieves a larger improvement at all four stations (<xref ref-type="table" rid="T4">Table 4</xref>). It indicates that using features for training can improve the prediction ability of the model to a greater extent.</p>
<table-wrap id="T4" position="float">
<label>TABLE 4</label>
<caption>
<p>Comparison of results of methods with and without features.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Station</th>
<th align="left">With feature</th>
<th align="left">Without feature</th>
<th align="left">Performance improvement (%)</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">A</td>
<td align="left">0.000089</td>
<td align="left">0.000617</td>
<td align="left">697.2</td>
</tr>
<tr>
<td align="left">B</td>
<td align="left">0.000022</td>
<td align="left">0.000053</td>
<td align="left">238.5</td>
</tr>
<tr>
<td align="left">C</td>
<td align="left">0.000254</td>
<td align="left">0.000754</td>
<td align="left">297.0</td>
</tr>
<tr>
<td align="left">D</td>
<td align="left">0.000238</td>
<td align="left">0.000728</td>
<td align="left">306.3</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>As shown in <xref ref-type="fig" rid="F4">Figure 4</xref>, the constructed and extracted features possess different weights, and with the algorithmic feature visualization function, we conclude that the <inline-formula id="inf31">
<mml:math id="m41">
<mml:mrow>
<mml:msub>
<mml:mi>R</mml:mi>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula>, <inline-formula id="inf32">
<mml:math id="m42">
<mml:mrow>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mi>w</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> and <inline-formula id="inf33">
<mml:math id="m43">
<mml:mrow>
<mml:msub>
<mml:mi>R</mml:mi>
<mml:mrow>
<mml:mi>s</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>d</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> of rainfall are the three most important features. In fact, these three features correspond to the magnitude, temporal characteristics and variability of rainfall, respectively.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>The weight value of 9 features in the model.</p>
</caption>
<graphic xlink:href="fenvs-11-1131954-g004.tif"/>
</fig>
<p>After the configuration combination experiments, the configuration with the best results was finally selected as follows: when selecting the original rainfall data, it is better to use the 1-h sliding rainfall, which can enhance the fine waterlogging prediction. Of the total number of features constructed and extracted, a combination of 9 features was selected to balance computational efficiency and prediction accuracy (<italic>rain dry, rain month, rain min, rain AUC</italic> and <italic>rain cum</italic> were removed). The nine features did not overfit on the 4 stations, indicating that our feature construction makes sense. The experimental results of the three algorithms were compared, and the RF algorithm had superior robustness.</p>
<p>In <xref ref-type="fig" rid="F5">Figure 5</xref>, the blue curve is the rainfall and the orange curve is the waterlogging depth, and it can be seen that there is a strong correlation between the two. <xref ref-type="fig" rid="F6">Figure 6</xref> shows the predicted and true values of the waterlogging depth, and it can be seen that the model can predict the change trend well, with an average error within 2&#xa0;cm. Prediction model evaluation for four stations can be seen in <xref ref-type="table" rid="T5">Table 5</xref>.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Rainfall and waterlogging curves for events in four stations. <bold>(A)</bold> station A event: 143; <bold>(B)</bold> station A event: 220; <bold>(C)</bold> station B event: 105; <bold>(D)</bold> station B event: 191; <bold>(E)</bold> station C event: 244; <bold>(F)</bold> station D event: 98.</p>
</caption>
<graphic xlink:href="fenvs-11-1131954-g005.tif"/>
</fig>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>Predicted depth of waterlogging at four stations. <bold>(A)</bold> station A event: 143; <bold>(B)</bold> station A event: 220; <bold>(C)</bold> station B event: 105; <bold>(D)</bold> station B event: 191; <bold>(E)</bold> station C event: 244; <bold>(F)</bold> station D event: 98.</p>
</caption>
<graphic xlink:href="fenvs-11-1131954-g006.tif"/>
</fig>
<table-wrap id="T5" position="float">
<label>TABLE 5</label>
<caption>
<p>Prediction model evaluation for four stations.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Station</th>
<th align="left">MSE</th>
<th align="left">MAE</th>
<th align="left">
<italic>R</italic>
<sup>2</sup> score</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">A</td>
<td align="left">0.00007</td>
<td align="left">0.01083</td>
<td align="left">0.95341</td>
</tr>
<tr>
<td align="left">B</td>
<td align="left">0.00001</td>
<td align="left">0.00049</td>
<td align="left">0.88907</td>
</tr>
<tr>
<td align="left">C</td>
<td align="left">0.00011</td>
<td align="left">0.00091</td>
<td align="left">0.92823</td>
</tr>
<tr>
<td align="left">D</td>
<td align="left">0.00006</td>
<td align="left">0.00042</td>
<td align="left">0.97167</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec sec-type="discussion" id="s5">
<title>5 Discussion</title>
<p>
<list list-type="simple">
<list-item>
<p>1) The method in this paper has a smaller MSE and more accurate prediction results than the results obtained by directly using the original rainfall event series. The model enhances the performance and robustness by time series feature extraction. Better prediction results are achieved by adjusting the feature parameters when the model is not over-fitted.</p>
</list-item>
<list-item>
<p>2) <xref ref-type="fig" rid="F7">Figure 7</xref> shows the ratio of waterlogging depth (m) to rainfall (m) for each of the four stations in each slice of the waterlogging event, which we define here as the amplification factor (AF). Because the number and duration of waterlogging events differ among the stations, the amount of data at station A is much larger than that at stations C and D. The curves reflect the vulnerability of each station, i.e., its capacity to mitigate rainfall, in terms of waterlogging events. The AF of station A is generally larger, indicating that station A is more likely to form deeper water under the same rainfall event. The AF of station D is generally smaller, indicating its better ability to withstand waterlogging hazards. As seen in <xref ref-type="table" rid="T6">Table 6</xref>, station A has the least drainage outlet area in the area and the drainage volume is at a lower level. As seen in <xref ref-type="fig" rid="F8">Figure 8</xref>, the topography of station A is the flattest among the four stations (<xref ref-type="table" rid="T6">Table 6</xref>, variance of DEM is only 3.91), and the central terrain of the area is in a significant depression, so it is more likely to form standing water. In terms of the number of waterlogging events, station A also has the most, reaching 13.7 times that of station D.</p>
</list-item>
<list-item>
<p>3) The results of flow cumulative values extracted from the topographic data can reflect the runoff direction and flow results. From <xref ref-type="table" rid="T6">Table 6</xref>, the combined regional flow cumulative value of station A reaches 2,151,063, and it can be seen from <xref ref-type="fig" rid="F9">Figure 9</xref> that the area of station A contains a flow vector with a larger cumulative value. Together with the factors mentioned in 2), this results in the larger AF at station A.</p>
</list-item>
<list-item>
<p>4) Station D has the best comprehensive drainage capacity among the four stations. With other geographical features similar to those of station B, the total waterlogging time at station D is only 24.63% of that at station B. This indicates that the better the regional drainage facilities, the lower the risk of waterlogging.</p>
</list-item>
<list-item>
<p>5) It can be seen from <xref ref-type="fig" rid="F8">Figure 8</xref> that all four waterlogging monitoring stations are set up in the more low-lying areas of the region. It indicates that the setting of monitoring stations is generally oriented to the occurrence of waterlogging hazards, and the priority of construction is higher in places with high frequency of occurrence. The results of this study on geographic features can be used to find areas with similar geographic features and thus provide reference for the additional waterlogging monitoring stations.</p>
</list-item>
<list-item>
<p>6) The four selected waterlogging monitoring stations are all in urban built-up areas, and the land cover type is impervious surface. This type of land surface possesses a runoff coefficient of about 0.95&#x2013;1, so the infiltration capacity of rainfall is weak. If the percentage of impervious surface on the surrounding ground is high, it will further increase the risk of waterlogging formation.</p>
</list-item>
<list-item>
<p>7) The proportion of waterlogging events in the total events is low, which can affect the prediction effect of the model. By selecting a sample of waterlogging events in advance, the positive sample weights are enhanced through stratified sampling and data balancing, which can improve the model prediction ability and reduce errors.</p>
</list-item>
</list>
</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption>
<p>Results of amplification factors for the four stations.</p>
</caption>
<graphic xlink:href="fenvs-11-1131954-g007.tif"/>
</fig>
<table-wrap id="T6" position="float">
<label>TABLE 6</label>
<caption>
<p>Statistical results of geographical characteristics of the four stations.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Station</th>
<th align="center">DEM (m)</th>
<th align="center">D_min (m)</th>
<th align="center">D_max (m)</th>
<th align="center">D_std</th>
<th align="center">Land cover</th>
<th align="center">Sum_flow</th>
<th align="center">Dra_A (m<sup>2</sup>)</th>
<th align="center">Dra_V (m<sup>3</sup>)</th>
<th align="center">Number of waterlogging slices</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">A</td>
<td align="center">33</td>
<td align="center">21</td>
<td align="center">43</td>
<td align="center">
<bold>
<italic>3.91</italic>
</bold>
</td>
<td align="center">IS</td>
<td align="center">
<bold>2,151,063</bold>
</td>
<td align="center">
<bold>
<italic>145.46</italic>
</bold>
</td>
<td align="center">
<bold>
<italic>7,210.38</italic>
</bold>
</td>
<td align="center">
<bold>2,437</bold>
</td>
</tr>
<tr>
<td align="center">B</td>
<td align="center">18</td>
<td align="center">&#x2212;3</td>
<td align="center">90</td>
<td align="center">13.71</td>
<td align="center">IS</td>
<td align="center">4,047.50</td>
<td align="center">236.93</td>
<td align="center">9,448.44</td>
<td align="center">1,419</td>
</tr>
<tr>
<td align="center">C</td>
<td align="center">
<bold>
<italic>5</italic>
</bold>
</td>
<td align="center">&#x2212;8</td>
<td align="center">72</td>
<td align="center">13.33</td>
<td align="center">IS</td>
<td align="center">
<bold>
<italic>1,192.20</italic>
</bold>
</td>
<td align="center">198.45</td>
<td align="center">
<bold>14,863.07</bold>
</td>
<td align="center">751</td>
</tr>
<tr>
<td align="center">D</td>
<td align="center">11</td>
<td align="center">&#x2212;15</td>
<td align="center">41</td>
<td align="center">8.28</td>
<td align="center">IS</td>
<td align="center">10,600.46</td>
<td align="center">
<bold>335.14</bold>
</td>
<td align="center">11,961.56</td>
<td align="center">
<bold>
<italic>185</italic>
</bold>
</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>IS, Impermeable surface; Dra_A, Drainage area; Dra_V, Drainage volume.</p>
</fn>
<fn>
<p>&#x2a;Bold represents larger values, italic represents smaller values.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<fig id="F8" position="float">
<label>FIGURE 8</label>
<caption>
<p>Topography within a 500&#xa0;m radius of stations. <bold>(A)</bold> Station A; <bold>(B)</bold> station B; <bold>(C)</bold> station C; <bold>(D)</bold> station D. Blue represents higher elevation values and red represents lower elevation values. The middle circles represent the zones of 50, 100, and 150&#xa0;m from the station. (The terrain is stretched, with a stretch factor of 3).</p>
</caption>
<graphic xlink:href="fenvs-11-1131954-g008.tif"/>
</fig>
<fig id="F9" position="float">
<label>FIGURE 9</label>
<caption>
<p>Cumulative value of flow in the area of station A.</p>
</caption>
<graphic xlink:href="fenvs-11-1131954-g009.tif"/>
</fig>
</sec>
<sec sec-type="conclusion" id="s6">
<title>6 Conclusion</title>
<p>Short-term prediction of waterlogging has been a hot research issue, because earlier warning can reduce casualties and property damage from disasters. Owing to the Markovian character of waterlogging itself, future waterlogging can be predicted using the waterlogging of previous periods. However, how to use rainfall data to predict waterlogging where there are no sensors becomes an urgent problem. In this study, a time-series machine learning model using feature extraction for rainfall events significantly improves the prediction with an average error of less than 2&#xa0;cm. The nine features extracted are validated and proved to be really beneficial and reasonable for model capability improvement. Combined with future rainfall forecast information, it is possible to calculate whether waterlogging will form at a point in the short-term future time period. Based on the prediction results, the government can dispatch rescue forces or block the relevant roads in advance. It provides a reliable basis for government emergency decision-making and risk analysis.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s7">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/supplementary materials; further inquiries can be directed to the corresponding author.</p>
</sec>
<sec id="s8">
<title>Author contributions</title>
<p>ZZ and LY contributed to conception and design of the study. ZZ and YC organized the database. ZZ, XJ, and YC performed the statistical analysis. ZZ and XJ completed the code compilation and method. ZH and JL revised the manuscript. LY and JL managed the implementation of the research activities and reviewed the manuscript. All authors contributed to manuscript revision, read, and approved the submitted version.</p>
</sec>
<sec id="s9">
<title>Funding</title>
<p>This research was funded by the National Key R&#x26;D Program of China (2018YFC0807000), the Natural Science Foundation of China (71771113), the National Key R&#x26;D Program of China (2019YFC0810705), Shenzhen Scientific Research Funding (Grant No. K22627501), and Shenzhen Science and Technology Plan platform and carrier special (Grant No. ZDSYS20210623092007023). It was also partly supported by the Shenzhen Science and Technology Program (KCXFZ20201221173601003) and the Henan Provincial Key Laboratory of Hydrosphere and Watershed Water Security.</p>
</sec>
<sec sec-type="COI-statement" id="s10">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s11">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Arshad</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Ogie</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Barthelemy</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Pradhan</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Verstaevel</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Perez</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Computer vision and IoT-based sensors in flood monitoring and mapping: A systematic review</article-title>. <source>Sensors (Basel)</source> <volume>19</volume> (<issue>22</issue>), <fpage>5012</fpage>. <pub-id pub-id-type="doi">10.3390/s19225012</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Burak</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Bilge</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>&#xdc;lker</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Computation of monthly runoff coefficients for Istanbul</article-title>. <source>Therm. Sci.</source> <volume>25</volume>, <fpage>1561</fpage>&#x2013;<lpage>1572</lpage>. <pub-id pub-id-type="doi">10.2298/TSCI191102147B</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>David</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Alpert</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Messer</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>The potential of cellular network infrastructures for sudden rainfall monitoring in dry climate regions</article-title>. <source>Atmos. Res.</source> <volume>131</volume>, <fpage>13</fpage>&#x2013;<lpage>21</lpage>. <pub-id pub-id-type="doi">10.1016/j.atmosres.2013.01.004</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Deo</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Wen</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Qi</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>A wavelet-coupled support vector machine model for forecasting global incident solar radiation using limited meteorological dataset</article-title>. <source>Appl. Energy</source> <volume>168</volume>, <fpage>568</fpage>&#x2013;<lpage>593</lpage>. <pub-id pub-id-type="doi">10.1016/j.apenergy.2016.01.130</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ding</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Feng</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Cheng</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Interpretable spatio-temporal attention LSTM model for flood forecasting</article-title>. <source>Neurocomputing</source> <volume>403</volume>, <fpage>348</fpage>&#x2013;<lpage>359</lpage>. <pub-id pub-id-type="doi">10.1016/j.neucom.2020.04.110</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Du</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Fang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Shi</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Analysis of dry/wet conditions using the standardized precipitation index and its potential usefulness for drought/flood monitoring in Hunan Province, China</article-title>. <source>Stoch. Environ. Res. Risk Assess.</source> <volume>27</volume>, <fpage>377</fpage>&#x2013;<lpage>387</lpage>. <pub-id pub-id-type="doi">10.1007/s00477-012-0589-6</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Duan</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Gao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Huawei</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>Z.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>The &#x201c;20 July 2021 major flood event&#x201d; in greater Zhengzhou, China: A case study of flooding severity and landscape characteristics</article-title>. <source>Land</source> <volume>11</volume>, <fpage>1921</fpage>. <pub-id pub-id-type="doi">10.3390/land11111921</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ferreira</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Walsh</surname>
<given-names>R. P. D.</given-names>
</name>
<name>
<surname>Shakesby</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Keizer</surname>
<given-names>J. J.</given-names>
</name>
<name>
<surname>Soares</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Gonzalez-Pelayo</surname>
<given-names>O.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Differences in overland flow, hydrophobicity and soil moisture dynamics between Mediterranean woodland types in a peri-urban catchment in Portugal</article-title>. <source>J. Hydrology</source> <volume>533</volume>, <fpage>473</fpage>&#x2013;<lpage>485</lpage>. <pub-id pub-id-type="doi">10.1016/j.jhydrol.2015.12.040</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gong</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Dynamic risk assessment of compound hazards based on VFS&#x2013;IEM&#x2013;IDM: A case study of typhoon&#x2013;rainstorm hazards in Shenzhen, China</article-title>. <source>Nat. Hazards Earth Syst. Sci.</source> <volume>22</volume>, <fpage>3271</fpage>&#x2013;<lpage>3283</lpage>. <pub-id pub-id-type="doi">10.5194/nhess-22-3271-2022</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Han</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Morrison</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Data-driven approaches for runoff prediction using distributed data</article-title>. <source>Stoch. Environ. Res. Risk Assess.</source> <volume>36</volume>, <fpage>2153</fpage>&#x2013;<lpage>2171</lpage>. <pub-id pub-id-type="doi">10.1007/s00477-021-01993-3</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Khalid</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Shehryar</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Nasreen</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2014</year>). &#x201c;<article-title>A survey of feature selection and feature extraction techniques in machine learning</article-title>,&#x201d; in <conf-name>Proceedings of the 2014 science and information conference</conf-name>, <conf-loc>London, UK</conf-loc>, <conf-date>August 2014</conf-date>.</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Khatri</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Kokane</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Kumar</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Pawar</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Prediction of waterlogged zones under heavy rainfall conditions using machine learning and GIS tools: A case study of Mumbai</article-title>. <source>GeoJournal</source> <volume>87</volume>, <fpage>1</fpage>&#x2013;<lpage>15</lpage>. <pub-id pub-id-type="doi">10.1007/s10708-022-10731-3</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Cui</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Lu</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Xie</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Evaluation of comprehensive emergency capacity to urban flood disaster: An example from Zhengzhou City in Henan Province, China</article-title>. <source>Sustainability</source> <volume>14</volume>, <fpage>13710</fpage>. <pub-id pub-id-type="doi">10.3390/su142113710</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Chan</surname>
<given-names>P. W.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>W.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Dynamic spatial-temporal precipitation distribution models for short-duration rainstorms in Shenzhen, China based on machine learning</article-title>. <source>Atmos. Res.</source> <volume>237</volume>, <fpage>104861</fpage>. <pub-id pub-id-type="doi">10.1016/j.atmosres.2020.104861</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Yesen</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Zheng</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Chai</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Ren</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2022a</year>). <article-title>Intelligent prediction method for waterlogging risk based on AI and numerical model</article-title>. <source>Water</source> <volume>14</volume>, <fpage>2282</fpage>. <pub-id pub-id-type="doi">10.3390/w14152282</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Yan</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Xia</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Song</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2022b</year>). <article-title>An effective rainfall&#x2013;ponding multi-step prediction model based on LSTM for urban waterlogging points</article-title>. <source>Appl. Sci.</source> <volume>12</volume>, <fpage>12334</fpage>. <pub-id pub-id-type="doi">10.3390/app122312334</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Loftis</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Forrest</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Katragadda</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Spencer</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Organski</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Nguyen</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>StormSense: A new integrated network of IoT water level sensors in the smart cities of Hampton Roads, VA</article-title>. <source>Mar. Technol. Soc. J.</source> <volume>52</volume>, <fpage>56</fpage>&#x2013;<lpage>67</lpage>. <pub-id pub-id-type="doi">10.4031/MTSJ.52.2.7</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mu</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Lyu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Huo</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Duan</surname>
<given-names>W.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Impact of temporal rainfall patterns on flash floods in Hue City, Vietnam</article-title>. <source>J. Flood Risk Manag.</source> <volume>14</volume>. <pub-id pub-id-type="doi">10.1111/jfr3.12668</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nath</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Ni-Meister</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Choudhury</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Impact of urbanization on land use and land cover change in Guwahati city, India and its implication on declining groundwater level</article-title>. <source>Groundw. Sustain. Dev.</source> <volume>12</volume>, <fpage>100500</fpage>. <pub-id pub-id-type="doi">10.1016/j.gsd.2020.100500</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nayeb Yazdi</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ketabchy</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Sample</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Scott</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Liao</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>An evaluation of HSPF and SWMM for simulating streamflow regimes in an urban watershed</article-title>. <source>Environ. Model. Softw.</source> <volume>118</volume>, <fpage>211</fpage>&#x2013;<lpage>225</lpage>. <pub-id pub-id-type="doi">10.1016/j.envsoft.2019.05.008</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Puttinaovarat</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Horkaew</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Flood forecasting system based on integrated big and crowdsource data by using machine learning techniques</article-title>. <source>IEEE Access</source> <volume>8</volume>, <fpage>5885</fpage>&#x2013;<lpage>5905</lpage>. <pub-id pub-id-type="doi">10.1109/access.2019.2963819</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ran</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Su</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Experimental study of the impact of rainfall characteristics on runoff generation and soil erosion</article-title>. <source>J. Hydrology</source> <volume>424</volume>, <fpage>99</fpage>&#x2013;<lpage>111</lpage>. <pub-id pub-id-type="doi">10.1016/j.jhydrol.2011.12.035</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shahabi</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Shirzadi</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Ghaderi</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Omidvar</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Al-Ansari</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Clague</surname>
<given-names>J. J.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Flood detection and susceptibility mapping using Sentinel-1 remote sensing data and a machine learning approach: Hybrid intelligence of bagging ensemble based on K-nearest neighbor classifier</article-title>. <source>Remote Sens.</source> <volume>12</volume> (<issue>2</issue>), <fpage>266</fpage>. <pub-id pub-id-type="doi">10.3390/rs12020266</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sofia</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Ragazzi</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Giandon</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Dalla Fontana</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Tarolli</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>On the linkage between runoff generation, land drainage, soil properties, and temporal patterns of precipitation in agricultural floodplains</article-title>. <source>Adv. Water Resour.</source> <volume>124</volume>, <fpage>120</fpage>&#x2013;<lpage>138</lpage>. <pub-id pub-id-type="doi">10.1016/j.advwatres.2018.12.003</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sundaram</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Devaraj</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Yarrakula</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Modeling, mapping and analysis of urban floods in India-a review on geospatial methodologies</article-title>. <source>Environ. Sci. Pollut. Res.</source> <volume>28</volume>, <fpage>67940</fpage>&#x2013;<lpage>67956</lpage>. <pub-id pub-id-type="doi">10.1007/s11356-021-16747-5</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>A method to increase the number of positive samples for machine learning-based urban waterlogging susceptibility assessments</article-title>. <source>Stoch. Environ. Res. Risk Assess.</source> <volume>36</volume>, <fpage>1</fpage>&#x2013;<lpage>18</lpage>. <pub-id pub-id-type="doi">10.1007/s00477-021-02035-8</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tarasova</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Basso</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Zink</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Merz</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Exploring controls on rainfall-runoff events: 1. Time series-based event separation and temporal dynamics of event runoff response in Germany</article-title>. <source>Water Resour. Res.</source> <volume>54</volume> (<issue>10</issue>), <fpage>7711</fpage>&#x2013;<lpage>7732</lpage>. <pub-id pub-id-type="doi">10.1029/2018WR022587</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Prediction of urban water accumulation points and water accumulation process based on machine learning</article-title>. <source>Earth Sci. Inf.</source> <volume>14</volume>, <fpage>2317</fpage>&#x2013;<lpage>2328</lpage>. <pub-id pub-id-type="doi">10.1007/s12145-021-00700-8</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2020b</year>). <article-title>Depth prediction of urban flood under different rainfall return periods based on deep learning and data warehouse</article-title>. <source>Sci. Total Environ.</source> <volume>716</volume>, <fpage>137077</fpage>. <pub-id pub-id-type="doi">10.1016/j.scitotenv.2020.137077</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2020a</year>). <article-title>Real-time prediction of the water accumulation process of urban stormy accumulation points based on deep learning</article-title>. <source>IEEE Access</source> <volume>8</volume>, <fpage>1</fpage>. <pub-id pub-id-type="doi">10.1109/ACCESS.2020.3017277</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xue</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Zou</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Numerical simulation of urban waterlogging based on FloodArea model</article-title>. <source>Adv. Meteorology</source> <volume>2016</volume>, <fpage>1</fpage>&#x2013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1155/2016/3940707</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yan</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Hamid</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Toward more robust extreme flood prediction by Bayesian hierarchical and multimodeling</article-title>. <source>Nat. Hazards</source> <volume>81</volume>, <fpage>203</fpage>&#x2013;<lpage>225</lpage>. <pub-id pub-id-type="doi">10.1007/s11069-015-2070-6</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yan</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Feng</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>A rapid prediction model of urban flood inundation in a high-risk area coupling machine learning and numerical simulation approaches</article-title>. <source>Int. J. Disaster Risk Sci.</source> <volume>12</volume>, <fpage>903</fpage>&#x2013;<lpage>918</lpage>. <pub-id pub-id-type="doi">10.1007/s13753-021-00384-0</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Pan</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Improving the Horton infiltration equation by considering soil moisture variation</article-title>. <source>J. Hydrology</source> <volume>586</volume>, <fpage>124864</fpage>. <pub-id pub-id-type="doi">10.1016/j.jhydrol.2020.124864</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yin</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Gentine</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Slater</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Gu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Pokhrel</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Hanasaki</surname>
<given-names>N.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Future socio-ecosystem productivity threatened by compound drought&#x2013;heatwave events</article-title>. <source>Nat. Sustain.</source> <volume>6</volume>, <fpage>259</fpage>&#x2013;<lpage>272</lpage>. <pub-id pub-id-type="doi">10.1038/s41893-022-01024-1</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yin</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Gu</surname>
<given-names>L.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Thermodynamic driving mechanisms for the formation of global precipitation extremes and ecohydrological effects</article-title>. <source>Sci. China Earth Sci.</source> <volume>66</volume>, <fpage>92</fpage>&#x2013;<lpage>110</lpage>. <pub-id pub-id-type="doi">10.1007/s11430-022-9987-0</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yin</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Ye</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Yin</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>A review of advances in urban flood risk analysis over China</article-title>. <source>Stoch. Environ. Res. Risk Assess.</source> <volume>29</volume>, <fpage>1063</fpage>&#x2013;<lpage>1070</lpage>. <pub-id pub-id-type="doi">10.1007/s00477-014-0939-7</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zavala</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Jord&#xe1;n</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Bellinfante</surname>
<given-names>N.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Seasonal variability of runoff and soil loss on forest road backslopes under simulated rainfall</article-title>. <source>Catena</source> <volume>74</volume>, <fpage>73</fpage>&#x2013;<lpage>79</lpage>. <pub-id pub-id-type="doi">10.1016/j.catena.2008.03.006</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Assessing the impact of climate change on the waterlogging risk in coastal cities: A case study of Guangzhou, South China</article-title>. <source>J. Hydrometeorol.</source> <volume>18</volume>, <fpage>1549</fpage>&#x2013;<lpage>1562</lpage>. <pub-id pub-id-type="doi">10.1175/JHM-D-16-0157.1</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Zeng</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Multi-source data fusion and hydrodynamics for urban waterlogging risk identification</article-title>. <source>Int. J. Environ. Res. Public Health</source> <volume>20</volume> (<issue>3</issue>), <fpage>2528</fpage>. <pub-id pub-id-type="doi">10.3390/ijerph20032528</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhou</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Prediction and early warning method of inundation process at waterlogging points based on Bayesian model average and data-driven</article-title>. <source>J. Hydrology Regional Stud.</source> <volume>44</volume>, <fpage>101248</fpage>. <pub-id pub-id-type="doi">10.1016/j.ejrh.2022.101248</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zounemat-Kermani</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Matta</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Cominola</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Xia</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Liang</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Hinkelmann</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Neurocomputing in surface water hydrology and hydraulics: A review of two decades retrospective, current status and future prospects</article-title>. <source>J. Hydrology</source> <volume>588</volume>, <fpage>125085</fpage>. <pub-id pub-id-type="doi">10.1016/j.jhydrol.2020.125085</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>