<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Environ. Sci.</journal-id>
<journal-title>Frontiers in Environmental Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Environ. Sci.</abbrev-journal-title>
<issn pub-type="epub">2296-665X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">917545</article-id>
<article-id pub-id-type="doi">10.3389/fenvs.2022.917545</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Environmental Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Boosted Regression Tree Algorithm for the Reconstruction of GRACE-Based Terrestrial Water Storage Anomalies in the Yangtze River Basin</article-title>
<alt-title alt-title-type="left-running-head">Dannouf et al.</alt-title>
<alt-title alt-title-type="right-running-head">On the Reconstruction of GRACE-TWSA Using BRT</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Dannouf</surname>
<given-names>Ramia</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1766374/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Yong</surname>
<given-names>Bin</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Ndehedehe</surname>
<given-names>Christopher E.</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/796799/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Correa</surname>
<given-names>Fabio M.</given-names>
</name>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1890114/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Ferreira</surname>
<given-names>Vagner</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1313807/overview"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>State Key Laboratory of Hydrology-Water Resources and Hydraulic Engineering</institution>, <institution>Hohai University</institution>, <addr-line>Nanjing</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>School of Earth Sciences and Engineering</institution>, <institution>Hohai University</institution>, <addr-line>Nanjing</addr-line>, <country>China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Australian Rivers Institute</institution>, <institution>Griffith University</institution>, <addr-line>Nathan</addr-line>, <addr-line>QLD</addr-line>, <country>Australia</country>
</aff>
<aff id="aff4">
<sup>4</sup>
<institution>Griffith School of Environment and Science</institution>, <institution>Griffith University</institution>, <addr-line>Nathan</addr-line>, <addr-line>QLD</addr-line>, <country>Australia</country>
</aff>
<aff id="aff5">
<sup>5</sup>
<institution>Department of Statistics</institution>, <institution>Rhodes University</institution>, <addr-line>Grahamstown</addr-line>, <country>South Africa</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/558346/overview">Susana Barbosa</ext-link>, University of Porto, Portugal</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1773749/overview">Guillaume Ramillien</ext-link>, UMR5563 G&#xe9;osciences Environnement Toulouse (GET), France</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1053587/overview">Ziyan Zheng</ext-link>, Institute of Atmospheric Physics (CAS), China</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Vagner Ferreira, <email>vagnergf@hhu.edu.cn</email>
</corresp>
<fn fn-type="other">
<p>This article was submitted to Environmental Informatics and Remote Sensing, a section of the journal Frontiers in Environmental Science</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>12</day>
<month>07</month>
<year>2022</year>
</pub-date>
<pub-date pub-type="collection">
<year>2022</year>
</pub-date>
<volume>10</volume>
<elocation-id>917545</elocation-id>
<history>
<date date-type="received">
<day>11</day>
<month>04</month>
<year>2022</year>
</date>
<date date-type="accepted">
<day>07</day>
<month>06</month>
<year>2022</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2022 Dannouf, Yong, Ndehedehe, Correa and Ferreira.</copyright-statement>
<copyright-year>2022</copyright-year>
<copyright-holder>Dannouf, Yong, Ndehedehe, Correa and Ferreira</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>The terrestrial water storage anomaly (TWSA) from the previous Gravity Recovery and Climate Experiment (GRACE) covers a relatively short period (15 years) with several missing periods. This study explores the boosted regression trees (BRT) and the artificial neural network (ANN) to reconstruct the TWSA series between 1982 and 2014 over the Yangtze River basin (YRB). Both algorithms are trained with several hydro-climatic variables (e.g., precipitation, soil moisture, and temperature) and climate indices for the YRB. The results from this study show that the BRT is capable of reconstructing TWSA and shows a Nash&#x2013;Sutcliffe efficiency (NSE) of 0.89 and a root-mean-square error (RMSE) of 18.94&#xa0;mm during the test stage, outperforming ANN by about 2.3% and 7.4%, respectively. As a step further, the reliability of this technique in reconstructing TWSA beyond the GRACE era was also evaluated. Hence, a closed-loop simulation using the artificial TWSA series over 1982&#x2013;2014 under the same scenarios for the actual GRACE data shows that BRT can predict TWSA (NSE of 0.92 and RMSE of 6.93&#xa0;mm). Again, the BRT outperformed the ANN by approximately 1.1% and 5.3%, respectively. This study provides a new perspective for reconstructing and filling the gaps in the GRACE&#x2013;TWSA series over data-scarce regions, which is desired for hydrological drought characterization and environmental studies. BRT offers such an opportunity for the GRACE Follow-On mission to predict 11&#xa0;months of missing TWSA data by relying on a limited number of predictive variables, hence being adjudged to be more economical than the ANN.</p>
</abstract>
<kwd-group>
<kwd>artificial neural network</kwd>
<kwd>boosted regression trees</kwd>
<kwd>GRACE</kwd>
<kwd>machine learning</kwd>
<kwd>terrestrial water storage anomaly</kwd>
</kwd-group>
<contract-sponsor id="cn001">National Key Research and Development Program of China<named-content content-type="fundref-id">10.13039/501100012166</named-content>
</contract-sponsor>
</article-meta>
</front>
<body>
<sec id="s1">
<title>1 Introduction</title>
<p>The terrestrial water storage anomaly (TWSA) from the observations of the preceding Gravity Recovery and Climate Experiment (GRACE) and the contemporary Follow-On (GRACE-FO) missions is the sum of the water stored as snow/ice, surface waters, soil moisture, groundwater, and biomass. It is assumed to be concentrated on a virtual layer of water thickness at the Earth&#x2019;s surface (<xref ref-type="bibr" rid="B17">Ferreira et al., 2020b</xref>). TWSA is a critical component of the hydrologic cycle, and thus, an instrumental dataset that underpins our understanding of water availability on different spatial scales and how its variability is affected by climate change and anthropogenic activities. Consequently, the monthly fields of TWSA have been used globally in hydrological studies to provide essential outcomes such as identifying key drivers of land water storage across the globe (<xref ref-type="bibr" rid="B45">Rodell et al., 2018</xref>). For example, a GRACE hydrological assessment over North India, as was undertaken by <xref ref-type="bibr" rid="B44">Rodell et al. (2009)</xref>, highlighted the unsustainable consumption of groundwater for irrigation and other anthropogenic uses. While this assessment was revisited by <xref ref-type="bibr" rid="B29">Long et al. (2016)</xref>, the combined impacts of climate variability and human water management on freshwater stocks across several continents have been detailed (see, e.g., <xref ref-type="bibr" rid="B2">Ahmed et al., 2014</xref>; <xref ref-type="bibr" rid="B37">Ndehedehe and Ferreira, 2020</xref>). Also notable is the work of <xref ref-type="bibr" rid="B41">Reager et al. (2014)</xref>, who investigated the suitability of GRACE observations to infer the flood potential of various river basins at a lead time of several months. Indeed, GRACE applications are varied and transdisciplinary. 
This includes the possibility of estimating the evapotranspiration (<xref ref-type="bibr" rid="B42">Rodell et al., 2004a</xref>), river discharge (<xref ref-type="bibr" rid="B52">Syed et al., 2005</xref>) over data-poor regions, estimating water mass changes over permafrost regions (<xref ref-type="bibr" rid="B53">Velicogna et al., 2012</xref>), and data assimilations to improve the outputs of hydrological models (<xref ref-type="bibr" rid="B60">Zaitchik et al., 2008</xref>). Despite the importance of the TWSA datasets retrieved from the GRACE mission in hydrological studies, the relatively short period of approximately 20&#xa0;years, which contains an 11-month gap between the GRACE and GRACE-FO missions, poses a challenge to an accurate assessment of key hydrological metrics. In particular, several gaps due to the lack of reliable measurements constrain the full potential of TWSA in, for example, drought studies and understanding the pace of climate change (e.g., <xref ref-type="bibr" rid="B55">Vishwakarma, 2020</xref>).</p>
<p>Several studies have attempted to reconstruct the TWSA series to cover long-term periods relying on different methods. For instance, <xref ref-type="bibr" rid="B26">Li et al. (2021)</xref> combined machine learning and time-series analysis with statistical decomposition techniques to globally reconstruct TWSA fields from 1979 to 2020. <xref ref-type="bibr" rid="B56">Wang et al. (2021)</xref> combined the GRACE data with soil moisture, precipitation, evapotranspiration, and temperature to reconstruct a long-term TWSA based on a long short-term memory (LSTM) model. A simple linear model combining TWSA over the Amazon with sea surface temperature (SST) indices has additionally been proposed (<xref ref-type="bibr" rid="B10">de Linage et al., 2014</xref>). Utilizing GRACE-derived TWSA and <italic>in situ</italic> river discharge data, <xref ref-type="bibr" rid="B5">Becker et al. (2011)</xref> applied a principal component analysis, which makes a linear and steady time-series supposition, to reconstruct GRACE&#x2013;TWSA from 1980 to 2008 over the Amazon Basin. Other approaches include the use of an autoregressive model with the independent component analysis to predict TWSA in West Africa incorporating precipitation records and SST indices (<xref ref-type="bibr" rid="B19">Forootan et al., 2014b</xref>). However, this autoregressive model assumes a constant status of TWSA over the area and the prediction accuracy decreases after a 2-year forecast length. The water balance approach has also been applied to extend the TWSA series back to 1980 (cf. <xref ref-type="bibr" rid="B58">Yin et al., 2019</xref>). This approach uses multi-source datasets as inputs in the terrestrial water budget equation. All examples mentioned here require the use of mathematical models. 
It must be mentioned that the formulation of these techniques, which is primarily based on experimental datasets, and the rise in performance, has frequently been undertaken by way of increased model complexity, and the manner that they come to decisions, makes them a pattern/machine learning recognition problem (<xref ref-type="bibr" rid="B57">Wilby et al., 2003</xref>).</p>
<p>There is no mathematical model that can efficiently describe hydrological phenomena (cf. <xref ref-type="bibr" rid="B34">Mukhopadhyay, 2003</xref>). However, algorithms that make supposition(s) of the time-series with adaptive abilities provide an excellent alternative to predict the TWSA fields over a region. Consequently, many studies have explored the feasibility of artificial neural networks (ANNs) to reconstruct the TWSA series due to their ability to model linear and non-linear systems based on learning and prediction algorithms (<xref ref-type="bibr" rid="B3">Ahmed et al., 2019</xref>). ANN extracts complex relationships between model inputs and targets and builds complex and non-linear relationships that are robust as a forecasting tool for hydrological variables. For instance, extended TWSA time-series using an ANN approach to examine the long-term hydrological properties of TWSA have been investigated by several authors (see, e.g., <xref ref-type="bibr" rid="B27">Long et al., 2014</xref>; <xref ref-type="bibr" rid="B61">Zhang et al., 2016</xref>; <xref ref-type="bibr" rid="B33">Mukherjee and Ramachandran, 2018</xref>; <xref ref-type="bibr" rid="B15">Ferreira et al., 2019</xref>; <xref ref-type="bibr" rid="B3">Ahmed et al., 2019</xref>; <xref ref-type="bibr" rid="B8">Chen et al., 2019</xref>, and references therein). Overall, these studies agreed that the ANN&#x2019;s performance improved when climatic observations were integrated with the GRACE&#x2013;TWSA datasets. Nevertheless, this might be a disadvantage since the accuracy of the reconstruction depends a lot on data availability, especially for architectures with many layers. For many regions and river basins, this might impose limitations in using ANN. As a result, economical methods that can still faithfully reconstruct actual observations would be preferable, especially over data-poor regions. 
The present study proposes the use of a new approach, the boosted regression tree (BRT) technique to reconstruct the TWSA series.</p>
<p>The BRT technique depends on the insights and methodologies of both statistical and machine-learning approaches. This method differs from conventional regression strategies, which produce a single best model, in that it uses the boosting approach to adaptively combine a large number of simple tree models to improve predictive performance (<xref ref-type="bibr" rid="B13">Elith et al., 2006</xref>; <xref ref-type="bibr" rid="B24">Leathwick et al., 2006</xref>; <xref ref-type="bibr" rid="B25">Leathwick et al., 2008</xref>). The boosting process used in BRT has its origins in machine learning (<xref ref-type="bibr" rid="B47">Schapire, 2003</xref>). However, subsequent developments in the statistical community have reinterpreted it as an advanced form of regression (<xref ref-type="bibr" rid="B20">Friedman et al., 2000</xref>). BRT has many vital benefits of tree-based strategies: 1) it can be used with various types of response (binomial, Gaussian, and Poisson) by specifying the distribution of the error and the link function; 2) it contains a probabilistic or random component, which improves predictive performance and decreases the variance of the final model by using only a random subset of the data to fit every new tree (<xref ref-type="bibr" rid="B21">Friedman, 2002</xref>); 3) the algorithm automatically detects the best fit; 4) the model shows the impact of each predictor on the reconstruction after accounting for their overall contributions; and 5) the algorithm is robust and unaffected by missing values and outliers (<xref ref-type="bibr" rid="B1">Abeare, 2009</xref>). Fitting numerous trees in BRT overcomes the most significant obstacle of single tree models (i.e., their comparatively weak predictive performance). BRT models are complex; however, they can be summarized in forms that provide robust hydrological insight. Thereby, BRT is suitable for many environmental applications as well.</p>
<p>The main aim of this study is to evaluate the use of BRT to reconstruct the TWSA series of the Yangtze River basin (YRB), China. So far, BRT has been used only in groundwater level prognosis (<xref ref-type="bibr" rid="B40">Rahman et al., 2020</xref>; <xref ref-type="bibr" rid="B49">Sharafati et al., 2020</xref>) and, as far as we know, this study presents the first application of BRT to fill the missing gaps in the GRACE-derived TWSA. Furthermore, a comparison of the performance of BRT and ANN techniques has not been attempted in the few recent studies that focused on TWSA reconstruction. Therefore, the focus of this study is to generate a continuous and uninterrupted TWSA series and develop a robust predictive technique that can backcast TWSA to address the hydrological and environmental problems over a given river basin. Furthermore, this study compares BRT outputs with those from a non-linear&#x2013;autoregressive neural network with exogenous inputs (NARX) to define the most accurate method. Due to the nature of GRACE&#x2013;TWSA, it has a statistical and physical relationship with the hydro-climatic variables (e.g., precipitation and soil moisture). For instance, <xref ref-type="bibr" rid="B31">Mo et al. (2016)</xref> found a strong correlation between precipitation and TWSA in southern China. Also, the availability of TWSA affects evapotranspiration and runoff (ibid). <xref ref-type="bibr" rid="B30">Ma et al. (2017)</xref> indicated that GRACE observations and Climate Change Initiative Soil Moisture could be used as significant indices of the spatial distribution of the drought process and its effect on the environment and local communities. This could improve water resource management and the early detection and monitoring of droughts. Consequently, the present study also uses a comprehensive and different data spectrum, replicating the dynamics in the energy and water cycles that affect TWSA for training the network over the YRB. 
Hence, the performance of the BRT model is the focus of the analyses, whilst also assessing the relative importance of the predictors used to reconstruct the TWSA.</p>
</sec>
<sec id="s2">
<title>2 Study Area</title>
<p>The Yangtze River is the longest in Asia, with a length of approx. 6,397&#xa0;km. It flows from the Tibetan Plateau and runs through Qinghai, then turns south to Sichuan and Tibet; after that, it reaches Yunnan, Chongqing, and continues to Hubei, Hunan, running through Jiangxi, Anhui, and Jiangsu, and then emptying into the East China Sea near Shanghai. Its basin (hereafter YRB), extends for about 3,200&#xa0;km from west to east and more than 1,000&#xa0;km from north to south and drains an area of 1.8 &#xd7; 10<sup>6</sup>&#xa0;km<sup>2</sup>, nearly one-fifth of the total land area of China (<xref ref-type="fig" rid="F1">Figure 1</xref>). The YRB has undergone considerable modifications in climate and land cover/use, including the largest hydroelectric power station in the world (Three Gorges Dam&#x2014;TGD). The TGD&#x2019;s reservoir is the most vital anthropogenic feature in the YRB. The dam extends for 2.3&#xa0;km and is 185&#xa0;m in height.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Location map of the Yangtze River basin, China, and its main surface waters. Source: adapted from <xref ref-type="bibr" rid="B16">Ferreira et al. (2020a)</xref>.</p>
</caption>
<graphic xlink:href="fenvs-10-917545-g001.tif"/>
</fig>
<p>The Yangtze River is very famous and has a significant role in China&#x2019;s development of its economy, agriculture, tourism, transportation, culture, etc. Although the Qinling Mountains and Huaihe River are the more commonly recognized border between northern and southern China in the climate and water resource fields, the Yangtze River is also perceived as the north&#x2013;south boundary, at least from a cultural perspective. The climate in the north of the Yangtze River is dry with low temperatures and light rain, whereas, in the south, the climate is humid and warm with sufficient rainfall. Climate variation, floods and drought events, and irrigation have profoundly affected the water resources, bringing significant impacts on humans and nature. Three severe catastrophic floods happened in the YRB in 1931, 1956, and 1998. Although catastrophic floods like these have not happened in the YRB since the beginning of the 21st century, the YRB has faced a lot of medium and small floods. In addition, eight drought events have been identified in the YRB during the GRACE era, with three major droughts occurring in 2004, 2006, and 2011 (<xref ref-type="bibr" rid="B51">Sun et al., 2018</xref>).</p>
</sec>
<sec id="s3">
<title>3 Materials and Methods</title>
<sec id="s3-1">
<title>3.1 Datasets</title>
<sec id="s3-1-1">
<title>3.1.1 Global Precipitation Climatology Centre Precipitation</title>
<p>The Global Precipitation Climatology Centre (GPCC) was established in 1989 at the request of the World Meteorological Organization (WMO). The National Meteorological Service of Germany runs it as a German contribution to the World Climate Research Program. GPCC&#x2019;s mandate is the worldwide analysis of monthly and daily precipitation on the Earth&#x2019;s land surface based on <italic>in situ</italic> rain gauge data.</p>
<p>The monthly GPCC data, specifically, the GPCC&#x2013;MP, gridded at a spatial resolution of 1&#xb0; were used in this study due to their long-term record. The series starts from 1982, offering sufficient data for long-time period studies, and is based on the monthly records acquired by the Global Telecommunication System (GTS) of the WMO from about 7,000 to 9,000 stations (after high-level quality control). Generally, the GPCC&#x2013;MP is known as the best <italic>in situ</italic> and GTS-based monthly land&#x2013;surface precipitation reference product publicly available. To ensure the consistency of the time-series and reveal errors in the station metadata, the harmonization of station metadata and a sophisticated quality control are critical for GPCC to integrate several datasets. The data were retrieved from an online database, and further information is available at <xref ref-type="bibr" rid="B48">Schneider et al. (2013)</xref>. The particular choice for this product is supported by the assessment and investigations carried out by <xref ref-type="bibr" rid="B59">Yu et al. (2020)</xref> over mainland China.</p>
</sec>
<sec id="s3-1-2">
<title>3.1.2 ERA-Interim Data System</title>
<p>To model the response of TWSA to evapotranspiration and temperature changes, instantaneous moisture flux (IE, equivalent to evapotranspiration), surface temperature (soil temperature level 1&#x2014;SMTL1), soil temperature level 2/3/4 (SMTL2, SMTL3, and SMTL4), and 2-meter temperature (T2m) fields were retrieved from the ERA-Interim data system. These datasets were all obtained at a monthly temporal interval and gridded at a spatial resolution of 1&#xb0;. The long-term consistency was the motivation to select the ERA-Interim reanalysis data for this study (cf. <xref ref-type="bibr" rid="B18">Forootan et al., 2014a</xref>).</p>
</sec>
<sec id="s3-1-3">
<title>3.1.3 GLDAS&#x2013;Noah and GLDAS&#x2013;Variable Infiltration Capacity</title>
<p>Soil moisture (the aggregate of all the layers from 0 to 2&#xa0;m in depth), canopy, and snow storages from Global Land Data Assimilation Systems (GLDAS, <xref ref-type="bibr" rid="B43">Rodell et al., 2004b</xref>) driven by Noah in its version 2, which covers the period from 1948 to 2015, were used in this study as predictors. We chose these data due to their availability over long periods. GLDAS&#x2013;Noah version 2 datasets consist of 1&#xb0; gridded data with a temporal resolution of 1&#xa0;month.</p>
<p>For evaluating the performance of the BRT and ANN models, a closed-loop simulation using &#x201c;independent&#x201d; TWSA datasets from the GLDAS-driven Variable Infiltration Capacity (VIC) land surface model L4, version 2, was considered. The GLDAS&#x2013;VIC monthly product consists of 1&#xb0; gridded data covering the period 1948 to 2015. These data were chosen due to their availability over long periods. Moreover, the GLDAS&#x2013;VIC model creates the simulation outcomes that are nearest to the <italic>in situ</italic> data, and it additionally has the lowest dispersions and bias error values compared with other GLDAS streams.</p>
</sec>
<sec id="s3-1-4">
<title>3.1.4 Climate Indices</title>
<p>To model the response of YRB to the ENSO phenomenon, Bivariate ENSO Time-series (BEST, cf. <xref ref-type="bibr" rid="B50">Smith and Sardeshmukh, 2000</xref>), which is derived from the Southern Oscillation Index (SOI) and Ni&#xf1;o 3.4 was used. The BEST index incorporates the oceanic (Ni&#xf1;o 3.4) and atmospheric (SOI) components of ENSO processes into a particular field, and therefore, gives a more accurate description of the phenomenon. The time-series of worldwide temperature anomalies was also utilized to simulate the impact of global warming on TWSA variability, as shown by <xref ref-type="bibr" rid="B12">Dong et al. (2019)</xref>. Over the YRB, it has been shown that the correlation between the eco-flow metrics and selected de-trended climate indices is strong, particularly for the synchronous Northern Hemisphere and Indian Ocean Dipole indices, as further explained by <xref ref-type="bibr" rid="B12">Dong et al. (2019)</xref>. Moreover, these authors (ibid) indicated that the seasonal streamflow correlated more with selected climate indices than the annual streamflow. Thereby, the reconstruction of TWSA over the YRB also needs to consider such climate indices as predictors.</p>
</sec>
<sec id="s3-1-5">
<title>3.1.5 Gravity Recovery and Climate Experiment&#x2013;Terrestrial Water Storage Anomaly Series</title>
<p>The GRACE-derived TWSA datasets used in this study are the so-called Level-3 products (<xref ref-type="bibr" rid="B23">Landerer and Swenson, 2012</xref>). They comprise monthly gridded values at a spatial resolution of 1&#xb0;-by-1&#xb0; based on the spherical harmonic coefficients provided by the Center for Space Research (CSR). All details regarding the processing procedures and caveats are available in the companion publication by <xref ref-type="bibr" rid="B23">Landerer and Swenson (2012)</xref>. Albeit TWSA fields were synthesized at a spatial resolution of 1&#xb0;-by-1&#xb0;, they are still limited to the nominal resolution of GRACE, which is 3&#xb0;-by-3&#xb0;. Nevertheless, scaling factors such as those computed by <xref ref-type="bibr" rid="B23">Landerer and Swenson (2012)</xref> can be used to improve the spatial resolution of GRACE&#x2013;TWSA to 1&#xb0;-by-1&#xb0;. The scale factor used is the one computed by <xref ref-type="bibr" rid="B28">Long et al. (2015)</xref>. To this end, the TWSA monthly grids refer to a temporal baseline of 2004&#x2013;2009 at which the mean was subtracted.</p>
<p>The temporal mean was also removed from the respective datasets (<xref ref-type="sec" rid="s3-1-1">Sections 3.1.1</xref>&#x2013;<xref ref-type="sec" rid="s3-1-4">3.1.4</xref>) for the period 2004&#x2013;2009. <xref ref-type="fig" rid="F2">Figure 2</xref> shows the correlation coefficient between TWSA and the predictors described in the aforementioned sub-sections. Overall, there is a good correspondence between TWSA and SM (0.887), and TWSA and P (0.612).</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Pearson correlation coefficients (PCCs) between TWSA and the predictors described in <xref ref-type="sec" rid="s3-1-1">Sections 3.1.1</xref>&#x2013;<xref ref-type="sec" rid="s3-1-4">3.1.4</xref>.</p>
</caption>
<graphic xlink:href="fenvs-10-917545-g002.tif"/>
</fig>
</sec>
</sec>
<sec id="s3-2">
<title>3.2 Methods</title>
<p>The methodological approach implemented in this study consists of the steps summarized in <xref ref-type="fig" rid="F3">Figure 3</xref> and is further described in the following sub-sections.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Flowchart of the primary process steps to reconstruct the GRACE-derived terrestrial water storage anomaly (TWSA) based on BRT and ANN (NARX) algorithms. The flowchart also shows the steps necessary for evaluating the reliability of the reconstructions using GLDAS&#x2013;VIC-simulated TWSA.</p>
</caption>
<graphic xlink:href="fenvs-10-917545-g003.tif"/>
</fig>
<sec id="s3-2-1">
<title>3.2.1 Boosted Regression Tree</title>
<p>BRT, also known as stochastic gradient boosting, is one of many techniques that aim to enhance the performance and precision of the prediction of a single model by fitting several models and combining them to get the best prediction. The ability of the BRT method to enhance precision is based on the assumption that it is more straightforward to find and average many rough prediction rules rather than to obtain a single high-precision prediction rule (<xref ref-type="bibr" rid="B47">Schapire, 2003</xref>). BRT is an effective technique because it combines two approaches: regression trees, which are from the classification and regression tree (decision tree) set of models, and boosting, which builds and combines a group of models (<xref ref-type="bibr" rid="B14">Elith et al., 2008</xref>).</p>
<sec id="s3-2-1-1">
<title>3.2.1.1 Regression Tree</title>
<p>The regression tree is created through a bilateral iterative division, a repeated operation that divides the data into branches or segmentations. After that, it resumes by splitting every branch into smaller sets as the process moves up every branch.</p>
<p>Initially, all records in the training set (the a priori categorized records that are utilized to define the tree structure) are collected into the same partition. The algorithm then begins allocating the data into the first two segments, utilizing each potential bilateral division on each field. Then, the algorithm selects the split that minimizes the sum of the squared deviations from the mean in two separate segmentations. After that, this splitting base is utilized in each of the new partitions. This procedure will continue until every node amounts to the minimal node size set by the user and becomes a leaf node. (That is, when the sum of the squared deviations from the average in a node is zero, that node is deemed a leaf node even if it does not amount to the minimal size). All randomly selected subsets contain a similar number of data points, and the points are chosen from the entire data set. For example, <xref ref-type="fig" rid="F4">Figure 4</xref> shows two predictor variables <italic>X</italic>
<sub>1</sub> and <italic>X</italic>
<sub>2</sub>, which might be surface temperature and precipitation, and the response <italic>Y</italic>, the mean adult weight of types. Areas <italic>Y</italic>
<sub>1</sub>, <italic>Y</italic>
<sub>2</sub>, and so on, are leaves, and <italic>t</italic>
<sub>1</sub>, <italic>t</italic>
<sub>2</sub>, and so forth are the dividing points.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>
<bold>(A)</bold> shows a single regression tree with a response <italic>Y</italic>, in which <italic>X</italic>
<sub>1</sub> and <italic>X</italic>
<sub>2</sub> are two predictor variables, and <italic>t</italic>
<sub>1</sub>, <italic>t</italic>
<sub>2</sub>, etc. are split points. <bold>(B)</bold> shows the regression tree&#x2019;s prediction surface. Source: Adapted from (<xref ref-type="bibr" rid="B22">Hastie et al., 2009</xref>, p. 306).</p>
</caption>
<graphic xlink:href="fenvs-10-917545-g004.tif"/>
</fig>
</sec>
<sec id="s3-2-1-2">
<title>3.2.1.2 Boosting the Regression Tree&#x2014;Boosted Regression Tree</title>
<p>Boosting is a technique that integrates the outputs of weak learners (regression trees) to provide a stronger, improved overall predictive performance. Therefore, the final model (BRT) is a combination of several individual regression trees, fitted in a forward step-wise approach (<xref ref-type="bibr" rid="B14">Elith et al., 2008</xref>).</p>
<p>An efficient design for fitting a single decision tree is to grow a bigger tree. Afterward, one can prune it by collapsing the weakest links identified through cross-validation (<xref ref-type="bibr" rid="B22">Hastie et al., 2009</xref>).</p>
<p>Boosting is a numerical optimization approach that reduces the loss function by adding, at each step, a new tree that best reduces the loss function. The initial regression tree in BRT maximally reduces the loss function for the chosen tree size. Then, at every subsequent step, the focus is on the residuals, that is, on the variation in the response that the model has not yet explained. The mean squared error (MSE) is a measure of the goodness of fit. It computes the squared distance between an estimator and the estimated parameter, which is given by:<disp-formula id="e1">
<mml:math id="m1">
<mml:mi>L</mml:mi>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mi>&#x3b8;</mml:mi>
</mml:mrow>
</mml:mfenced>
<mml:mo>&#x3d;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mo movablelimits="false" form="prefix">&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>y</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>y</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msup>
<mml:mo>,</mml:mo>
</mml:math>
<label>(1)</label>
</disp-formula>where <italic>L</italic> is the training loss function, <italic>&#x3b8;</italic> denotes the parameters, and <italic>y</italic> is the observed response in the training data (input <italic>X</italic>); <inline-formula id="inf1">
<mml:math id="m2">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>y</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula> is the prediction given by<disp-formula id="e2">
<mml:math id="m3">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>y</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mo movablelimits="false" form="prefix">&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:msub>
<mml:mrow>
<mml:mi>&#x3b8;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:msub>
<mml:mrow>
<mml:mi>X</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>.</mml:mo>
</mml:math>
<label>(2)</label>
</disp-formula>
</p>
<p>In boosting, models are fitted iteratively to the training records, gradually increasing the emphasis on the observations that are modeled poorly by the current series of trees. Boosting algorithms differ in how they quantify the lack of fit and choose the settings for the next iteration.</p>
<p>The BRT method has four essential features that have been applied in this study. They are:<list list-type="simple">
<list-item>
<p>1. The process is random (it contains a probabilistic or random factor). This random process enhances the predictive performance and lessens the variance of the definitive model, utilizing just a random subset of records to every new suitable tree (<xref ref-type="bibr" rid="B21">Friedman, 2002</xref>). This means that if a random seed is not set initially, the final models will be totally different at each run.</p>
</list-item>
<list-item>
<p>2. The consecutive model-fitting procedure builds on pre-fitted trees and concentrates more and more on predicting the most challenging observations. This differentiates the operation from one where a big tree is fitted to the data-series. Even so, if the ideal match was one tree, it might possibly be fitted through a sum of similar shrunken versions of itself in a boosted model.</p>
</list-item>
<list-item>
<p>3. Two critical parameters that are required to be set by the user:</p>
<list list-type="simple">
<list-item>
<p>a. Tree complexity (TC): this parameter specifies the split number in each tree. A TC value of 1 produces trees with just one split, meaning that the version ignores interactions among environmental variables. A TC value of 2 produces two splits and so forth.</p>
</list-item>
<list-item>
<p>b. Learning rate (LR&#x2014;also known as the shrinkage parameter): a number between 0 and 1 that sets the rate at which the algorithm converges and defines the contribution of every tree to the growing model. LR is inversely related to the number of iterations needed for the algorithm to complete; when the value of LR is small, numerous trees are required.</p>
</list-item>
</list>
</list-item>
</list>
</p>
<p>Together, these two parameters, TC and LR, define the number of trees needed for an optimum prediction. The aim is to find the combination of parameters that leads to the minimal error for the predictions. As a general rule, it is advisable to utilize a combination of tree complexity and learning rate values that produces a model containing a minimum of 1,000 trees. The optimum &#x201c;TC&#x201d; and &#x201c;LR&#x201d; values are contingent on the size of the dataset; e.g., for datasets with fewer than 500 occurrence points (or epochs, as is the case in this study), it is preferable to design simple trees (&#x201c;TC&#x201d; &#x3d; 2 or 3) with learning rates sufficiently small to allow the model to reach the minimum of 1,000 trees.<list list-type="simple">
<list-item>
<p>4. Prediction from the BRT technique is simple; however, interpretation needs tools to identify which interactions and variables are important, and to visualize fitted functions (<xref ref-type="bibr" rid="B14">Elith et al., 2008</xref>).</p>
</list-item>
</list>
</p>
<p>The prediction in this study was achieved using the following predictors: precipitation (P), surface temperature (SMTL1), soil temperature (level 2/3/4) (SMTL2, SMTL3, SMTL4), surface air pressure (SP), soil moisture (SM), 2-meter temperature (T2m), instantaneous moisture flux (IE), and climate indices (CI). <xref ref-type="fig" rid="F2">Figure 2</xref> shows the correlation among them as well as with TWSA.</p>
<p>One of the advantages of the BRT algorithm is the ease with which the influence of the predictors may be evaluated; in addition, the algorithm largely disregards uninformative predictors while fitting trees.</p>
<p>Regularization is necessary for BRT due to its sequential model fitting, which allows trees to be added until the data are completely overfitted. This overfitting results in a poor performance on accurate data. BRT regularization jointly involves the LR, the optimization of the number of trees (NT), and the TC. The aim is to find the combination of parameters (LR, NT, and TC) that yields the minimal predictive error. BRT&#x2019;s regularization and shrinkage are done using the Lasso method (least absolute shrinkage and selection operator). The Lasso method shrinks several coefficients and sets others to 0, and it attempts to keep the good features of both subset selection and ridge regression.</p>
</sec>
</sec>
<sec id="s3-2-2">
<title>3.2.2 Non-linear Autoregressive Neural Network With Exogenous Inputs&#x2014;NARX</title>
<p>In this study, we used the NARX in the network design. NARX is an artificial neural network that also includes repetitive feedback from many network layers to the input layer (<xref ref-type="bibr" rid="B4">Ardalani-Farsa and Zolfaghari, 2010</xref>). It has been widely utilized by many researchers to model non-linear prediction processes (<xref ref-type="bibr" rid="B3">Ahmed et al., 2019</xref>; <xref ref-type="bibr" rid="B15">Ferreira et al., 2019</xref>). The NARX architecture predicts a signal via regressing the initial output signal values and the initial values of an independent (exogenous) input signal.</p>
<p>In this study, the NARX reconstruction model utilized 18 hidden layers. (Hereafter, NARX will be addressed simply as ANN.) These layers were adjusted by using a Bayesian regularization back propagation learning rule. The sigmoid transfer function was also utilized. The independent inputs consist of the same predictors that were used in BRT. After preparing the needed exogenous variables, the network was trained using the training period from April 2002 to November 2014. In the network designing, 70% of the data were used for training the network, 10% to validate and stop the training prior to overfitting, and 20% for testing (utilized as independent data). We trained the network with an open loop. After training and testing the network, the outputs from the ANN were validated using the metrics shown in <xref ref-type="sec" rid="s3-2-3">Section 3.2.3</xref>. After that, the trained network was used to reconstruct the GRACE&#x2013;TWSA from March 2002 to January 1982.</p>
</sec>
<sec id="s3-2-3">
<title>3.2.3 Assessment and Performance Measures</title>
<p>To assess the reliability of the BRT, and due to the lack of GRACE&#x2013;TWSA over the backcast period, the reconstruction process was also validated by creating a similar network to predict TWSA from GLDAS&#x2013;VIC, which provides a long-period time series (1948&#x2013;2015). This network was trained to predict GLDAS&#x2013;VIC&#x2013;TWSA (GLDAS&#x2013;TWSA<sub>BRT</sub>) from April 2002 to November 2014; after that, the trained network was utilized to backcast TWSA from March 2002 to January 1982. The reconstructed GLDAS&#x2013;VIC time series (from March 2002 to January 1982) and the original datasets were utilized to validate the outputs from the BRT.</p>
<p>Likewise, to assess the reliability of ANN in reconstructing the long-period TWSA, GLDAS&#x2013;VIC was utilized in a &#x201c;closed-loop&#x201d; simulation to evaluate the goodness of the extended TWSA series from March 2002 to January 1982. The networks were trained with the same predictors (exogenous variables) as those of GRACE&#x2013;TWSA (<xref ref-type="fig" rid="F3">Figure 3</xref>) for the same duration (April 2002 to November 2014). Afterward, the network was used to predict GLDAS&#x2013;VIC TWSA (GLDAS-TWSA<sub>ANN</sub>) from January 1982 to March 2002, and the outcomes were compared to the original GLDAS&#x2013;VIC TWSA dataset. The same process was repeated for BRT reconstruction.</p>
<p>The performance of the reconstructed TWSA series was determined using the Nash&#x2013;Sutcliffe efficiency (NSE) coefficient, and the root-mean-square error (RMSE) given as (e.g., <xref ref-type="bibr" rid="B32">Moriasi et al., 2007</xref>):<disp-formula id="e3">
<mml:math id="m4">
<mml:mtext>NSE</mml:mtext>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msubsup>
<mml:mrow>
<mml:mo movablelimits="false" form="prefix">&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msubsup>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mtext>TWS</mml:mtext>
<mml:msub>
<mml:mrow>
<mml:mtext>A</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mtext>obs</mml:mtext>
<mml:mo>,</mml:mo>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mtext>TWS</mml:mtext>
<mml:msub>
<mml:mrow>
<mml:mtext>A</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mtext>rec</mml:mtext>
<mml:mo>,</mml:mo>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
<mml:mrow>
<mml:msubsup>
<mml:mrow>
<mml:mo movablelimits="false" form="prefix">&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msubsup>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mtext>TWS</mml:mtext>
<mml:msub>
<mml:mrow>
<mml:mtext>A</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mtext>obs</mml:mtext>
<mml:mo>,</mml:mo>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mtext>TWSA</mml:mtext>
</mml:mrow>
<mml:mo>&#x304;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mtext>obs</mml:mtext>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mfrac>
<mml:mo>,</mml:mo>
</mml:math>
<label>(3)</label>
</disp-formula>and<disp-formula id="e4">
<mml:math id="m5">
<mml:mtext>RMSE</mml:mtext>
<mml:mo>&#x3d;</mml:mo>
<mml:msqrt>
<mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:munderover accentunder="false" accent="false">
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:munderover>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mtext>TWS</mml:mtext>
<mml:msub>
<mml:mrow>
<mml:mtext>A</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mtext>obs</mml:mtext>
<mml:mo>,</mml:mo>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mtext>TWS</mml:mtext>
<mml:msub>
<mml:mrow>
<mml:mtext>A</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mtext>rec</mml:mtext>
<mml:mo>,</mml:mo>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:msqrt>
<mml:mo>,</mml:mo>
</mml:math>
<label>(4)</label>
</disp-formula>respectively.</p>
<p>The Pearson&#x2019;s correlation coefficient (PCC), given as:<disp-formula id="e5">
<mml:math id="m6">
<mml:mtext>PCC</mml:mtext>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msubsup>
<mml:mrow>
<mml:mo movablelimits="false" form="prefix">&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msubsup>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mtext>TWS</mml:mtext>
<mml:msub>
<mml:mrow>
<mml:mtext>A</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mtext>rec</mml:mtext>
<mml:mo>,</mml:mo>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mtext>TWSA</mml:mtext>
</mml:mrow>
<mml:mo>&#x304;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mtext>rec</mml:mtext>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mtext>TWS</mml:mtext>
<mml:msub>
<mml:mrow>
<mml:mtext>A</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mtext>obs</mml:mtext>
<mml:mo>,</mml:mo>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mtext>TWSA</mml:mtext>
</mml:mrow>
<mml:mo>&#x304;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mtext>obs</mml:mtext>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:msqrt>
<mml:mrow>
<mml:msubsup>
<mml:mrow>
<mml:mo movablelimits="false" form="prefix">&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msubsup>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mtext>TWS</mml:mtext>
<mml:msub>
<mml:mrow>
<mml:mtext>A</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mtext>rec</mml:mtext>
<mml:mo>,</mml:mo>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mtext>TWSA</mml:mtext>
</mml:mrow>
<mml:mo>&#x304;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mtext>rec</mml:mtext>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:msqrt>
<mml:msqrt>
<mml:mrow>
<mml:msubsup>
<mml:mrow>
<mml:mo movablelimits="false" form="prefix">&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msubsup>
<mml:msup>
<mml:mrow>
<mml:mfenced open="(" close=")">
<mml:mrow>
<mml:mtext>TWS</mml:mtext>
<mml:msub>
<mml:mrow>
<mml:mtext>A</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mtext>obs</mml:mtext>
<mml:mo>,</mml:mo>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mtext>TWSA</mml:mtext>
</mml:mrow>
<mml:mo>&#x304;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mtext>obs</mml:mtext>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:msqrt>
</mml:mrow>
</mml:mfrac>
<mml:mo>,</mml:mo>
</mml:math>
<label>(5)</label>
</disp-formula>was used to describe the degree of collinearity between the simulated and observed data.</p>
<p>In <xref ref-type="disp-formula" rid="e3">Eqs 3</xref>&#x2013;<xref ref-type="disp-formula" rid="e5">5</xref>, the variables are as follows: <italic>t</italic> represents the length of the time series of TWSA (that is, the total number of months considered in the evaluation), TWSA<sub>rec</sub> is the resulting reconstructed TWSA series based on BRT or ANN, TWSA<sub>obs</sub> is the observed TWSA based on GRACE data, and <inline-formula id="inf2">
<mml:math id="m7">
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mtext>TWSA</mml:mtext>
</mml:mrow>
<mml:mo>&#x304;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mtext>obs</mml:mtext>
</mml:mrow>
</mml:msub>
</mml:math>
</inline-formula> is the mean value of the observed TWSA series.</p>
</sec>
</sec>
</sec>
<sec id="s4">
<title>4 Results</title>
<sec id="s4-1">
<title>4.1 Terrestrial Water Storage Anomaly&#x2019;s Reconstruction Using the Boosted Regression Tree and Artificial Neural Network</title>
<p>We partitioned the data into training and testing sets using 80% of the data randomly assigned to the training set, and 20% of the data randomly assigned as the testing set (we got the best results with this partitioning percentage). After several trial attempts to find the appropriate values of the parameters to obtain an optimal accuracy of the TWSA prediction, it was found that the TC &#x3d; 5 and LR &#x3d; 0.0035 with 2,000 trees provided the best results over the YRB. The number of trees after the regularization and shrinkage was 200. <xref ref-type="fig" rid="F5">Figures 5A,C</xref> show the fitting against training and testing data for TWSA, respectively. Hence, inspecting the reconstructed values from the testing step, we found an overall agreement with the actual values of the TWSA series for the specific months (<xref ref-type="fig" rid="F5">Figure 5C</xref>). The deviation residuals are used as a loss function to assess the reconstruction, which in terms of RMSE has a value of 18.94&#xa0;mm. Furthermore, the NSE coefficient based on the comparison between the actual and reconstructed TWSA series in the testing step (<xref ref-type="fig" rid="F5">Figure 5C</xref>) presents a value of approximately 0.89 and a PCC of 0.95 (<xref ref-type="table" rid="T1">Table 1</xref>).</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>
<bold>(A,B)</bold> show the training stage of the prediction of the TWSA series for the YRB based on BRT and ANN, respectively. <bold>(C,D)</bold> show the test stage of the TWSA series of the YRB based on BRT and ANN, respectively. <bold>(E,F)</bold> show the predictors&#x2019; importance in both BRT and ANN methods, respectively.</p>
</caption>
<graphic xlink:href="fenvs-10-917545-g005.tif"/>
</fig>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Summary statistics for the reconstructed GRACE&#x2013;TWSA based on BRT and ANN during the validation stage using 20% of the whole time series.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Product</th>
<th align="center">RMSE [mm]</th>
<th align="center">NSE [unitless]</th>
<th align="center">PCC [unitless]</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">GRACE-TWSA<sub>BRT</sub>
</td>
<td align="char" char=".">18.94</td>
<td align="char" char=".">0.89</td>
<td align="char" char=".">0.95</td>
</tr>
<tr>
<td align="left">GRACE-TWSA<sub>ANN</sub>
</td>
<td align="char" char=".">20.34</td>
<td align="char" char=".">0.87</td>
<td align="char" char=".">0.93</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Likewise, the ANN was used in this study to reconstruct GRACE&#x2013;TWSA backward from March 2002 to January 1982 precisely in the same way as BRT. In an open loop, the network was trained and tested from April 2002 to November 2014. The optimal ANN model used to backcast GRACE&#x2013;TWSA over the YRB was chosen from all possible combinations of neurons and delays. <xref ref-type="fig" rid="F5">Figures 5B, D</xref> show the time-series response during the training and the test stages, respectively. Upon training and testing the network, the results show that the accuracy of the network in terms of RMSE value is 20.34&#xa0;mm (<xref ref-type="table" rid="T1">Table 1</xref>). This shows an underperformance of the ANN-reconstructed series of about 7.4% relative to the BRT-based reconstruction. Furthermore, the NSE presents a value of approximately 0.87, and the PCC shows a value of 0.93 (<xref ref-type="table" rid="T1">Table 1</xref>), slightly lower than those based on the BRT evaluation (<xref ref-type="table" rid="T1">Table 1</xref>).</p>
<p>The relative importance of the predictors used in the BRT model shows that soil moisture (SM) is the most important variable in TWSA reconstruction over the YRB showing a relative contribution of about 81.9%. Conversely, soil temperature level 2 (SMTL2) has the lowest importance, with a contribution of about 1.0%. Likewise, <xref ref-type="fig" rid="F5">Figure 5F</xref> indicates the relative importance of the input variables (predictor importance) of the predictors used in the ANN model. It can be seen that most of the variables present relative contributions between 11% and 14% (<xref ref-type="fig" rid="F5">Figure 5F</xref>). SM usually shows a significantly positive correlation with variations of regional TWSA (<xref ref-type="fig" rid="F2">Figure 2</xref>). However, SM presents the lowest contribution with a relative weight of 3.1% for the overall reconstruction of the TWSA series over YRB; the same holds for the instantaneous moisture flux (IE), 6.8%, and T2m, 3.9%. However, ANN models may be complicated, and deciding which predictor is more valuable can be difficult without further experiments, which is beyond the scope of the present work.</p>
<p>The TWSA time series covering the 32&#xa0;years from January 1982 to December 2014 was reconstructed based on the respective training for BRT and ANN, as described previously (<xref ref-type="fig" rid="F6">Figure 6</xref>). The missing values seen in the original GRACE&#x2013;TWSA series (<xref ref-type="fig" rid="F6">Figure 6</xref>) were also provisioned in the reconstruction. The overall behaviors of the maximum and minimum amplitudes over the backcasted period (January 1982 to March 2002) are consistent with those of the observed (actual) data covering the period from April 2002 to December 2014. As already mentioned and presented in <xref ref-type="fig" rid="F5">Figures 5A, C</xref>, an overall match between the reconstructed and the actual TWSA series is seen for BRT-based results (<xref ref-type="fig" rid="F6">Figure 6</xref>). Generally, ANN-based results overestimate the high (e.g., early 2014) and low amplitudes (e.g., middle 2004). The higher RMSE value of the ANN (20.34&#xa0;mm) compared to that of BRT (18.94&#xa0;mm) from April 2002 to December 2014 confirms these discrepancies (<xref ref-type="table" rid="T1">Table 1</xref>).</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>Time series of TWSA predicted by the BRT and ANN (1982&#x2013;2014) and those observed (April 2002&#x2013;December 2014).</p>
</caption>
<graphic xlink:href="fenvs-10-917545-g006.tif"/>
</fig>
<p>Likewise, from January 1982 to March 2002, the ANN-reconstructed TWSA series generally presented amplitudes higher than those based on the BRT algorithm. Nevertheless, the BRT-reconstructed TWSA series showed higher amplitudes; for example, in the middle 1987 and 1989 periods. Notably, the lower amplitudes of TWSA are from 1990 to 1994, which could be associated with a mild drought during this period. Nevertheless, whatever could be the use and application of the GRACE&#x2013;TWSA reconstructed time-series (<xref ref-type="fig" rid="F6">Figure 6</xref>), assessing the algorithms is still necessary since there is no observed TWSA over the backcasted period (1982&#x2013;2001). Hence, a simulation is presented in the following (<xref ref-type="sec" rid="s4-2">Section 4.2</xref>) to address such a question.</p>
</sec>
<sec id="s4-2">
<title>4.2 Assessment of the Boosted Regression Tree and Artificial Neural Network for Reconstructing the Terrestrial Water Storage Anomaly&#x2014;A &#x201c;Closed-Loop&#x201d; Simulation</title>
<p>The aim of this experiment was two-fold: 1) to evaluate the performance of the BRT and ANN, and 2) to assess the reliability of the reconstructed series over the period of 1982&#x2013;2002.</p>
<p>A simulation of TWSA was implemented within a closed-loop process to estimate the goodness of the reconstructed TWSA series from 2002 to 1982. The simulations of TWSA are based on the water-storage compartments available in GLDAS&#x2013;VIC covering the period from January 1982 to December 2014 (<xref ref-type="sec" rid="s3-1">Section 3.1</xref>). The GLDAS&#x2013;VIC-simulated TWSA series was split into two parts: one from April 2002 to November 2014, just like the GRACE datasets, and another from January 1982 to March 2002 (the period to be reconstructed). The latter is used only for assessment purposes.</p>
<p>First, BRT reconstruction was carried out using the same predictors as described in <xref ref-type="sec" rid="s3-1">Section 3.1</xref>, with the only difference being the replacement of GRACE&#x2013;TWSA (April 2002&#x2013;November 2014) by the GLDAS&#x2013;VIC&#x2013;TWSA (April 2002&#x2013;November 2014). None of the predictors were taken from GLDAS&#x2013;VIC, thereby making this an independent evaluation. Second, as with BRT, the reconstruction using the ANN&#x2013;NARX based on GLDAS&#x2013;VIC&#x2013;TWSA was also carried out. <xref ref-type="fig" rid="F7">Figure 7</xref> shows the reconstructed TWSA time-series based on BRT and ANN (GLDAS&#x2013;TWSA<sub>BRT</sub> and GLDAS&#x2013;TWSA<sub>ANN</sub>) as well as the original GLDAS&#x2013;TWSA series (GLDAS&#x2013;TWSA<sub>obs</sub>).</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption>
<p>Reconstructed time series of GLDAS&#x2013;TWSA; the blue line is the original GLDAS&#x2013;TWSA time series (observation), the red line is the GLDAS&#x2013;TWSA time series as estimated by BRT, and the green line is the GLDAS&#x2013;TWSA time series as estimated by ANN.</p>
</caption>
<graphic xlink:href="fenvs-10-917545-g007.tif"/>
</fig>
<p>The overall behaviors of the maximum and minimum amplitudes over the backcasted period (1982&#x2013;2001) by the BRT method (GLDAS&#x2013;TWSA<sub>BRT</sub>) are more consistent with the observed data amplitudes (GLDAS&#x2013;TWSA<sub>obs</sub>) in comparison with those amplitudes based on ANN (GLDAS&#x2013;TWSA<sub>ANN</sub>, see <xref ref-type="fig" rid="F7">Figure 7</xref>). Specifically, the GLDAS&#x2013;TWSA<sub>ANN</sub> series generally underestimates the maximum peaks, whereas the low peaks seem to agree with those based on BRT and the observed values.</p>
<p>In the assessment process and during the training and testing stages using GLDAS&#x2013;VIC&#x2013;TWSA over the period from April 2002 to November 2014, the BRT network performance presents an RMSE value of 5.68&#xa0;mm, NSE value of 0.94, and PCC value of 0.97 (<xref ref-type="table" rid="T2">Table 2</xref>). Furthermore, applying ANN to predict GLDAS&#x2013;VIC&#x2013;TWSA over the period April 2002 to November 2014, the performance of ANN presents an RMSE value of 5.72&#xa0;mm, NSE value of 0.94, and the PCC of 0.97 (<xref ref-type="table" rid="T2">Table 2</xref>). A marginal improvement in terms of RMSE of approximately 0.7% was found for BRT for the testing stage.</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Summary statistics for the reconstructed GLDAS&#x2013;VIC&#x2013;TWSA based on BRT and ANN during the training stage and validation. The validation refers to the comparison between the reconstructed series and those observed in <xref ref-type="fig" rid="F7">Figure 7</xref>, that is, the closed-loop simulation.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Product</th>
<th align="center">Stage</th>
<th align="center">RMSE [mm]</th>
<th align="center">NSE [unitless]</th>
<th align="center">PCC [unitless]</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td rowspan="2" align="left">GLDAS-TWSA<sub>BRT</sub>
</td>
<td align="center">Training</td>
<td align="char" char=".">5.68</td>
<td align="char" char=".">0.94</td>
<td align="char" char=".">0.97</td>
</tr>
<tr>
<td align="center">Validation</td>
<td align="char" char=".">6.93</td>
<td align="char" char=".">0.92</td>
<td align="char" char=".">0.96</td>
</tr>
<tr>
<td rowspan="2" align="left">GLDAS-TWSA<sub>ANN</sub>
</td>
<td align="center">Training</td>
<td align="char" char=".">5.72</td>
<td align="char" char=".">0.94</td>
<td align="char" char=".">0.97</td>
</tr>
<tr>
<td align="center">Validation</td>
<td align="char" char=".">7.30</td>
<td align="char" char=".">0.91</td>
<td align="char" char=".">0.96</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Nevertheless, a validation to assess the reliability of BRT and ANN algorithms to reconstruct GLDAS&#x2013;VIC&#x2013;TWSA over the period January 1982&#x2013;March 2002 was carried out. Contrary to what was done with GRACE&#x2013;TWSA, the GLDAS&#x2013;VIC&#x2013;TWSA series can be used to validate the reconstructed values since they are available over the desired period. Overall, the results of the BRT indicate more reliability with a performance better than ANN with an RMSE value of 6.93&#xa0;mm, NSE value of 0.92, and PCC value of 0.96 (<xref ref-type="table" rid="T2">Table 2</xref>). At the same time, the results of ANN present a value of RMSE of 7.30&#xa0;mm, NSE of 0.91, and PCC of 0.96 (<xref ref-type="table" rid="T2">Table 2</xref>).</p>
</sec>
</sec>
<sec id="s5">
<title>5 Discussion</title>
<p>Predictions gained from modeling and simulations are now considered an important goal of environmental studies, as they underpin important decisions by hydrologists and engineers, which can help inform policy. With this in mind, the principal focus of this study was to reconstruct the actual time series of GRACE&#x2013;TWSA backward from 2014 to 1982 (32&#xa0;years). The reconstruction of the GRACE-derived TWSA over the YRB used BRT and ANN (represented by NARX) algorithms. Consequently, the contributions of the present work are 1) validating the BRT algorithm, given that errors are within a tolerable range such as the GRACE uncertainty range, and 2) providing an extended time-series that supports studies such as droughts. Although several studies have considered the potential of TWSA reconstruction over the YRB (e.g., <xref ref-type="bibr" rid="B61">Zhang et al., 2016</xref>), none has considered the use of BRT to reconstruct TWSA.</p>
<p>First, BRT was used to reconstruct GRACE&#x2013;TWSA over the YRB, where 80% of the data were utilized for training, whereas the remaining 20% of the data were utilized for testing the network. Notably, this partitioning of data was selected after several trials to get the best accuracy. The model was constructed based on its physical relationships with ten hydro-climatic variables (the predictors). These variables are: precipitation (P), surface temperature (SMTL1), soil temperature (level 2/3/4) (SMTL2, SMTL3, SMTL4), surface air pressure (SP), soil moisture (SM), 2-meter temperature (T2m), instantaneous moisture flux (IE), and climate indices (CI). This network&#x2019;s results showed an RMSE value of 18.94&#xa0;mm, NSE value of 0.89, and PCC value of 0.95. This shows the consistency of the reconstructed (predicted) and the observed (actual) TWSA series (<xref ref-type="fig" rid="F5">Figures 5A,C</xref>). Second, ANN was trained precisely in the same way as BRT, in which the performance of the series indicated a slight underperformance of about 7.4%, 2.2%, and 2.1%, respectively, in terms of RMSE, NSE, and PCC (cf. <xref ref-type="table" rid="T1">Table 1</xref>). Both methods present RMSE values within GRACE&#x2019;s overall accuracy of about 20&#x2013;30&#xa0;mm over most river basins (<xref ref-type="bibr" rid="B46">Scanlon et al., 2016</xref>). Although the data used in this study were of coarse spatial resolution (1&#xb0;-by-1&#xb0;), they were valuable to prove the effectiveness of both algorithms for prediction with an acceptable accuracy.</p>
<p>Because the BRT technique is insensitive to multi-collinearity and outliers, it can fit complicated non-linear relationships, and it can automatically deal with the interactive impacts among predictors (<xref ref-type="bibr" rid="B13">Elith et al., 2006</xref>; <xref ref-type="bibr" rid="B14">Elith et al., 2008</xref>; <xref ref-type="bibr" rid="B11">Dedman et al., 2017</xref>). Thus, BRT seems a highly feasible technique to reconstruct TWSA using only one predictor like soil moisture (<xref ref-type="fig" rid="F5">Figure 5E</xref>), and that is reasonable because SM is very similar and highly correlated with TWSA in the YRB (see <xref ref-type="fig" rid="F2">Figure 2</xref>, and also cf. <xref ref-type="bibr" rid="B16">Ferreira et al., 2020a</xref>). This result also aligns with the findings of <xref ref-type="bibr" rid="B35">Naghibi and Pourghasemi (2015)</xref>. They found that BRT used only eight variables selected from the original data (14 variables). Some authors also declared that a close model would be more steady and easier to generalize (<xref ref-type="bibr" rid="B7">Catry et al., 2009</xref>; <xref ref-type="bibr" rid="B54">Vilar et al., 2010</xref>). Conversely, ANN-based reconstruction seems to necessitate more predictors. It used all predictors to achieve the prediction process and showed that SM got the lowest contribution in the TWSA prediction (<xref ref-type="fig" rid="F5">Figure 5F</xref>). This seems to be an obvious advantage of BRT compared to ANN. One could rely upon only one of the most accurate datasets (e.g., precipitation) based on remotely sensed or <italic>in-situ</italic> measurements to reconstruct TWSA instead of using all potential predictors (compare <xref ref-type="fig" rid="F5">Figures 5E,F</xref>).</p>
<p>Finally, based on BRT and ANN, the GRACE&#x2013;TWSA was backcasted from December 2014 to January 1982 (<xref ref-type="fig" rid="F6">Figure 6</xref>). However, an important question regarding the suitability of the extended GRACE&#x2013;TWSA series is how reliable are GRACE&#x2013;TWSA reconstructed series (<xref ref-type="fig" rid="F6">Figure 6</xref>)? In the absence of the observed TWSA between January 1982 and March 2002, a closed-loop simulation using TWSA from GLDAS&#x2013;VIC to evaluate the reliability of BRT and ANN was considered. A period equivalent to the GRACE data (April 2002&#x2013;November 2014) was used to generate BRT and ANN and then reconstruct the GLDAS&#x2013;VIC TWSA till 1982 (<xref ref-type="fig" rid="F7">Figure 7</xref>). Both networks were trained to simulate GLDAS&#x2013;VIC TWSA based on their non-linear physical relationships with the ten hydro-climatic variables. The BRT results showed a slightly better accuracy than those based on ANN (<xref ref-type="table" rid="T2">Table 2</xref>). Overall, BRT and ANN showed excellent performances with RMSE values of 6.93 and 7.30&#xa0;mm, respectively. This finding aligns with those from previous studies (e.g., <xref ref-type="bibr" rid="B39">Pourghasemi and Rahmati, 2018</xref>), which proved that BRT has a better performance than ANN. Additionally, some studies evaluated several different machine-learning techniques and found that BRT performed better than other popular algorithms (see, e.g., <xref ref-type="bibr" rid="B9">Cunningham et al., 2011</xref>; <xref ref-type="bibr" rid="B35">Naghibi and Pourghasemi, 2015</xref>; <xref ref-type="bibr" rid="B38">Nolan et al., 2015</xref>; <xref ref-type="bibr" rid="B36">Naghibi et al., 2016</xref>, for an exhaustive comparison of BRT with other algorithms applied to different subjects). 
Considering the ratio between the RMSE of the reconstructed GRACE&#x2013;TWSA and those from GLDAS&#x2013;VIC&#x2013;TWSA during the training phases (<xref ref-type="table" rid="T1">Tables 1</xref>, <xref ref-type="table" rid="T2">2</xref>) for the respective algorithms (BRT and ANN), it is possible to derive scale factors to infer the respective RMSEs of GRACE&#x2013;TWSA of 23.10 and 25.96&#xa0;mm, respectively. Again, such accuracies are akin to that of the GRACE era TWSA. Hence, this indicates that the temporal series shown in <xref ref-type="fig" rid="F6">Figure 6</xref> can be used in hydrological studies such as hydrological drought characterizations and the assessment of long-term changes of TWSA. This could be the subject of a separate study.</p>
</sec>
<sec id="s6">
<title>6 Conclusion</title>
<p>In the case of long-term studies (e.g., drought and flood assessments), TWSA from GRACE and GRACE-FO missions cover a relatively short period of approximately 20&#xa0;years. This means that it cannot be effectively applied for impact assessments from droughts and floods, or to deduce long-term water availability over the YRB. To address this limitation, this study compared two machine-learning approaches over the YRB to predict and reconstruct the TWSA back to 1982. To this end, boosted regression tree (BRT), a popular machine learning algorithm that increases the model&#x2019;s accuracy, was used to reconstruct GRACE&#x2013;TWSA. BRT is a robust algorithm that works very well with large datasets or when there are many hydro-climatic variables compared to the number of observations. It is also very robust in circumventing problems associated with missing values and outliers. This study found that BRT and artificial neural network (ANN, represented by a non-linear-autoregressive neural network with exogenous inputs&#x2014;NARX) methods appeared robust enough to sufficiently reconstruct GRACE&#x2013;TWSA over the YRB with accuracy akin to the GRACE dataset. The validation results of both techniques indicated that the BRT technique is a more reliable and &#x201c;economic&#x201d; model to reconstruct TWSA over the YRB. That is, the most correlated predictors, in our case, soil moisture and precipitation, could be enough to reconstruct the TWSA time-series. Hence, the method is highly recommended for study areas where only a few datasets are available as predictive variables (e.g., soil moisture and/or precipitation).</p>
</sec>
</body>
<back>
<sec id="s7" sec-type="data-availability">
<title>Data Availability Statement</title>
<p>Publicly available datasets were analyzed in this study. These data can be found here: GPCC precipitation available by Deutscher Wetterdienst at <ext-link ext-link-type="uri" xlink:href="https://opendata.dwd.de/climate_environment/GPCC/html/download_gate.html">https://opendata.dwd.de/climate_environment/GPCC/html/download_gate.html</ext-link>; ERA Interim datasets are available by the ECMWF at <ext-link ext-link-type="uri" xlink:href="https://apps.ecmwf.int/datasets/data/interim-full-moda/levtype=sfc/">https://apps.ecmwf.int/datasets/data/interim-full-moda/levtype&#x003D;sfc/</ext-link>; GLDAS fields are available by The NASA Goddard Earth Sciences Data and Information Services Center (GES DISC) at <ext-link ext-link-type="uri" xlink:href="https://ldas.gsfc.nasa.gov/gldas/gldas-get-data">https://ldas.gsfc.nasa.gov/gldas/gldas-get-data</ext-link>; the climate indices were retrieved from the NOAA Physical Sciences Laboratory (PSL) through the link <ext-link ext-link-type="uri" xlink:href="https://psl.noaa.gov/data/climateindices/list/">https://psl.noaa.gov/data/climateindices/list/</ext-link>; and the GRACE-TWSA monthly grids are available at <ext-link ext-link-type="uri" xlink:href="https://grace.jpl.nasa.gov/data/get-data/">https://grace.jpl.nasa.gov/data/get-data/</ext-link>.</p>
</sec>
<sec id="s8">
<title>Author Contributions</title>
<p>RD and VF conceived and designed the experiment. RD processed the datasets. CN and FC edited the final version of the manuscript. RD and BY wrote the original draft, and all authors contributed to writing the manuscript.</p>
</sec>
<sec id="s9">
<title>Funding</title>
<p>This study was supported by the National Key R&#x26;D Program (grant no. 2018YFA0605402).</p>
</sec>
<sec sec-type="COI-statement" id="s10">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s11">
<title>Publisher&#x2019;s Note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors, and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ack>
<p>The authors are grateful to all the dataset providers, as mentioned in <xref ref-type="sec" rid="s3-1">Section 3.1</xref>, on which the analysis in this manuscript is based. Bin Yong acknowledges the support from China&#x2019;s National Key R&#x26;D Program (grant no. 2018YFA0605402). Finally, we acknowledge the Associate Editor and two reviewers for their remarks which helped improve the quality of this manuscript.</p>
</ack>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Abeare</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2009</year>). <source>Comparisons of Boosted Regression Tree, GLM and GAM Performance in the Standardization of Yellowfin Tuna Catch-Rate Data from the Gulf of Mexico Lonline [sic] Fishery</source>. <comment>Ph.D. Thesis</comment>. <publisher-loc>Baton Rouge</publisher-loc>: <publisher-name>Louisiana State University</publisher-name>.</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ahmed</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Sultan</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Wahr</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Yan</surname>
<given-names>E.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>The Use of GRACE Data to Monitor Natural and Anthropogenic Induced Variations in Water Availability across Africa</article-title>. <source>Earth Sci. Rev.</source> <volume>136</volume>, <fpage>289</fpage>&#x2013;<lpage>300</lpage>. <pub-id pub-id-type="doi">10.1016/j.earscirev.2014.05.009</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ahmed</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Sultan</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Elbayoumi</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Tissot</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Forecasting GRACE Data over the African Watersheds Using Artificial Neural Networks</article-title>. <source>Remote Sens.</source> <volume>11</volume>, <fpage>1769</fpage>. <pub-id pub-id-type="doi">10.3390/rs11151769</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ardalani-Farsa</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Zolfaghari</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Chaotic Time Series Prediction with Residual Analysis Method Using Hybrid Elman-NARX Neural Networks</article-title>. <source>Neurocomputing</source> <volume>73</volume>, <fpage>2540</fpage>&#x2013;<lpage>2553</lpage>. <pub-id pub-id-type="doi">10.1016/j.neucom.2010.06.004</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Becker</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Meyssignac</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Xavier</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Cazenave</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Alkama</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Decharme</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Past Terrestrial Water Storage (1980-2008) in the Amazon Basin Reconstructed from GRACE and <italic>In Situ</italic> River Gauging Data</article-title>. <source>Hydrol. Earth Syst. Sci.</source> <volume>15</volume>, <fpage>533</fpage>&#x2013;<lpage>546</lpage>. <pub-id pub-id-type="doi">10.5194/hess-15-533-2011</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Catry</surname>
<given-names>F. X.</given-names>
</name>
<name>
<surname>Rego</surname>
<given-names>F. C.</given-names>
</name>
<name>
<surname>Ba&#xe7;&#xe3;o</surname>
<given-names>F. L.</given-names>
</name>
<name>
<surname>Moreira</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Modeling and Mapping Wildfire Ignition Risk in Portugal</article-title>. <source>Int. J. Wildland Fire</source> <volume>18</volume>, <fpage>921</fpage>&#x2013;<lpage>931</lpage>. <pub-id pub-id-type="doi">10.1071/WF07123</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Nie</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Long-term Groundwater Storage Variations Estimated in the Songhua River Basin by Using GRACE Products, Land Surface Models, and In-Situ Observations</article-title>. <source>Sci. Total Environ.</source> <volume>649</volume>, <fpage>372</fpage>&#x2013;<lpage>387</lpage>. <pub-id pub-id-type="doi">10.1016/j.scitotenv.2018.08.352</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cunningham</surname>
<given-names>S. C.</given-names>
</name>
<name>
<surname>Thomson</surname>
<given-names>J. R.</given-names>
</name>
<name>
<surname>Mac Nally</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Read</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Baker</surname>
<given-names>P. J.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Groundwater Change Forecasts Widespread Forest Dieback across an Extensive Floodplain System</article-title>. <source>Freshw. Biol.</source> <volume>56</volume>, <fpage>1494</fpage>&#x2013;<lpage>1508</lpage>. <pub-id pub-id-type="doi">10.1111/j.1365-2427.2011.02585.x</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>de Linage</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Famiglietti</surname>
<given-names>J. S.</given-names>
</name>
<name>
<surname>Randerson</surname>
<given-names>J. T.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Statistical Prediction of Terrestrial Water Storage Changes in the Amazon Basin Using Tropical Pacific and North Atlantic Sea Surface Temperature Anomalies</article-title>. <source>Hydrol. Earth Syst. Sci.</source> <volume>18</volume>, <fpage>2089</fpage>&#x2013;<lpage>2102</lpage>. <pub-id pub-id-type="doi">10.5194/hess-18-2089-2014</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dedman</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Officer</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Clarke</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Reid</surname>
<given-names>D. G.</given-names>
</name>
<name>
<surname>Brophy</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Gbm.auto: A Software Tool to Simplify Spatial Modelling and Marine Protected Area Planning</article-title>. <source>PLOS ONE</source> <volume>12</volume>, <fpage>e0188955</fpage>&#x2013;<lpage>16</lpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0188955</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dong</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Fang</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Zuo</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Hydrological Alteration of the Upper Yangtze River and its Possible Links with Large-Scale Climate Indices</article-title>. <source>Hydrol. Res.</source> <volume>50</volume>, <fpage>1120</fpage>&#x2013;<lpage>1137</lpage>. <pub-id pub-id-type="doi">10.2166/nh.2019.112</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Elith</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Graham</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Anderson</surname>
<given-names>R. R.</given-names>
</name>
<name>
<surname>Dud&#xed;k</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ferrier</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Guisan</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2006</year>). <article-title>Novel Methods Improve Prediction of Species&#x27; Distributions from Occurrence Data</article-title>. <source>Ecography</source> <volume>29</volume>, <fpage>129</fpage>&#x2013;<lpage>151</lpage>. <pub-id pub-id-type="doi">10.1111/j.2006.0906-7590.04596.x</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Elith</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Leathwick</surname>
<given-names>J. R.</given-names>
</name>
<name>
<surname>Hastie</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>A Working Guide to Boosted Regression Trees</article-title>. <source>J. Anim. Ecol.</source> <volume>77</volume>, <fpage>802</fpage>&#x2013;<lpage>813</lpage>. <pub-id pub-id-type="doi">10.1111/j.1365-2656.2008.01390.x</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ferreira</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Andam-Akorful</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Dannouf</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Adu-Afari</surname>
<given-names>E.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>A Multi-Sourced Data Retrodiction of Remotely Sensed Terrestrial Water Storage Changes for West Africa</article-title>. <source>Water</source> <volume>11</volume>, <fpage>401</fpage>. <pub-id pub-id-type="doi">10.3390/w11020401</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ferreira</surname>
<given-names>V. G.</given-names>
</name>
<name>
<surname>Yong</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Tourian</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Ndehedehe</surname>
<given-names>C. E.</given-names>
</name>
<name>
<surname>Shen</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Seitz</surname>
<given-names>K.</given-names>
</name>
<etal/>
</person-group> (<year>2020a</year>). <article-title>Characterization of the Hydro-Geological Regime of Yangtze River Basin Using Remotely-Sensed and Modeled Products</article-title>. <source>Sci. Total Environ.</source> <volume>718</volume>, <fpage>137354</fpage>. <pub-id pub-id-type="doi">10.1016/j.scitotenv.2020.137354</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ferreira</surname>
<given-names>V. G.</given-names>
</name>
<name>
<surname>Yong</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Seitz</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Heck</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Grombein</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2020b</year>). <article-title>Introducing an Improved GRACE Global Point-Mass Solution-A Case Study in Antarctica</article-title>. <source>Remote Sens.</source> <volume>12</volume>, <fpage>3197</fpage>. <pub-id pub-id-type="doi">10.3390/rs12193197</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Forootan</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Didova</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Schumacher</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Kusche</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Elsaka</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2014a</year>). <article-title>Comparisons of Atmospheric Mass Variations Derived from ECMWF Reanalysis and Operational Fields, over 2003-2011</article-title>. <source>J. Geod.</source> <volume>88</volume>, <fpage>503</fpage>&#x2013;<lpage>514</lpage>. <pub-id pub-id-type="doi">10.1007/s00190-014-0696-x</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Forootan</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Kusche</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Loth</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Schuh</surname>
<given-names>W.-D.</given-names>
</name>
<name>
<surname>Eicker</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Awange</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2014b</year>). <article-title>Multivariate Prediction of Total Water Storage Changes over West Africa from Multi-Satellite Data</article-title>. <source>Surv. Geophys.</source> <volume>35</volume>, <fpage>913</fpage>&#x2013;<lpage>940</lpage>. <pub-id pub-id-type="doi">10.1007/s10712-014-9292-0</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Friedman</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Tibshirani</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Hastie</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2000</year>). <article-title>Additive Logistic Regression: A Statistical View of Boosting (With Discussion and a Rejoinder by the Authors)</article-title>. <source>Ann. Stat.</source> <volume>28</volume>, <fpage>337</fpage>&#x2013;<lpage>407</lpage>. <pub-id pub-id-type="doi">10.1214/aos/1016218223</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Friedman</surname>
<given-names>J. H.</given-names>
</name>
</person-group> (<year>2002</year>). <article-title>Stochastic Gradient Boosting</article-title>. <source>Comput. Stat. Data Analysis</source> <volume>38</volume>, <fpage>367</fpage>&#x2013;<lpage>378</lpage>. <pub-id pub-id-type="doi">10.1016/S0167-9473(01)00065-2</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Hastie</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Tibshirani</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Friedman</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2009</year>). <source>The Elements of Statistical Learning</source>. <comment>Springer Series in Statistics</comment>. <publisher-loc>New York, NY</publisher-loc>: <publisher-name>Springer New York</publisher-name>. <pub-id pub-id-type="doi">10.1007/978-0-387-84858-7</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Landerer</surname>
<given-names>F. W.</given-names>
</name>
<name>
<surname>Swenson</surname>
<given-names>S. C.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Accuracy of Scaled GRACE Terrestrial Water Storage Estimates</article-title>. <source>Water Resour. Res.</source> <volume>48</volume>, <fpage>W04531</fpage>. <pub-id pub-id-type="doi">10.1029/2011WR011453</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Leathwick</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Elith</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Francis</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Hastie</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Taylor</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>Variation in Demersal Fish Species Richness in the Oceans Surrounding New Zealand: An Analysis Using Boosted Regression Trees</article-title>. <source>Mar. Ecol. Prog. Ser.</source> <volume>321</volume>, <fpage>267</fpage>&#x2013;<lpage>281</lpage>. <pub-id pub-id-type="doi">10.3354/meps321267</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Leathwick</surname>
<given-names>J. R.</given-names>
</name>
<name>
<surname>Elith</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Chadderton</surname>
<given-names>W. L.</given-names>
</name>
<name>
<surname>Rowe</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Hastie</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Dispersal, Disturbance and the Contrasting Biogeographies of New Zealand&#x27;s Diadromous and Non-diadromous Fish Species</article-title>. <source>J. Biogeogr.</source> <volume>35</volume>, <fpage>1481</fpage>&#x2013;<lpage>1497</lpage>. <pub-id pub-id-type="doi">10.1111/j.1365-2699.2008.01887.x</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Kusche</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Chao</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>L&#xf6;cher</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Long-term (1979-present) Total Water Storage Anomalies over the Global Land Derived by Reconstructing GRACE Data</article-title>. <source>Geophys. Res. Lett.</source> <volume>48</volume>, <fpage>e2021GL093492</fpage>. <pub-id pub-id-type="doi">10.1029/2021GL093492</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Long</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Shen</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Hong</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Longuevergne</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>Drought and Flood Monitoring for a Large Karst Plateau in Southwest China Using Extended GRACE Data</article-title>. <source>Remote Sens. Environ.</source> <volume>155</volume>, <fpage>145</fpage>&#x2013;<lpage>160</lpage>. <pub-id pub-id-type="doi">10.1016/j.rse.2014.08.006</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Long</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wada</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Hong</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Liang</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Deriving Scaling Factors Using a Global Hydrological Model to Restore GRACE Total Water Storage Changes for China&#x27;s Yangtze River Basin</article-title>. <source>Remote Sens. Environ.</source> <volume>168</volume>, <fpage>177</fpage>&#x2013;<lpage>193</lpage>. <pub-id pub-id-type="doi">10.1016/j.rse.2015.07.003</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Long</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Scanlon</surname>
<given-names>B. R.</given-names>
</name>
<name>
<surname>Wada</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Hong</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Singh</surname>
<given-names>V. P.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Have GRACE Satellites Overestimated Groundwater Depletion in the Northwest India Aquifer?</article-title> <source>Sci. Rep.</source> <volume>6</volume>, <fpage>24398</fpage>. <pub-id pub-id-type="doi">10.1038/srep24398</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ma</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Temporal Evolution of Regional Drought Detected from GRACE TWSA and CCI SM in Yunnan Province, China</article-title>. <source>Remote Sens.</source> <volume>9</volume>, <fpage>1124</fpage>. <pub-id pub-id-type="doi">10.3390/rs9111124</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mo</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>J. J.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Variations in Water Storage in China over Recent Decades from GRACE Observations and GLDAS</article-title>. <source>Nat. Hazards Earth Syst. Sci.</source> <volume>16</volume>, <fpage>469</fpage>&#x2013;<lpage>482</lpage>. <pub-id pub-id-type="doi">10.5194/nhess-16-469-2016</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Moriasi</surname>
<given-names>D. N.</given-names>
</name>
<name>
<surname>Arnold</surname>
<given-names>J. G.</given-names>
</name>
<name>
<surname>Van Liew</surname>
<given-names>M. W.</given-names>
</name>
<name>
<surname>Bingner</surname>
<given-names>R. L.</given-names>
</name>
<name>
<surname>Harmel</surname>
<given-names>R. D.</given-names>
</name>
<name>
<surname>Veith</surname>
<given-names>T. L.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>Model Evaluation Guidelines for Systematic Quantification of Accuracy in Watershed Simulations</article-title>. <source>Trans. ASABE</source> <volume>50</volume>, <fpage>885</fpage>&#x2013;<lpage>900</lpage>. <pub-id pub-id-type="doi">10.13031/2013.23153</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mukherjee</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Ramachandran</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Prediction of GWL with the Help of GRACE TWS for Unevenly Spaced Time Series Data in India: Analysis of Comparative Performances of SVR, ANN and LRM</article-title>. <source>J. Hydrol.</source> <volume>558</volume>, <fpage>647</fpage>&#x2013;<lpage>658</lpage>. <pub-id pub-id-type="doi">10.1016/j.jhydrol.2018.02.005</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mukhopadhyay</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2003</year>). <article-title>Application of Visual, Statistical and Artificial Neural Network Methods in the Differentiation of Water from the Exploited Aquifers in Kuwait</article-title>. <source>Hydrogeol. J.</source> <volume>11</volume>, <fpage>343</fpage>&#x2013;<lpage>356</lpage>. <pub-id pub-id-type="doi">10.1007/s10040-003-0257-5</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Naghibi</surname>
<given-names>S. A.</given-names>
</name>
<name>
<surname>Pourghasemi</surname>
<given-names>H. R.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>A Comparative Assessment between Three Machine Learning Models and Their Performance Comparison by Bivariate and Multivariate Statistical Methods in Groundwater Potential Mapping</article-title>. <source>Water Resour. Manag.</source> <volume>29</volume>, <fpage>5217</fpage>&#x2013;<lpage>5236</lpage>. <pub-id pub-id-type="doi">10.1007/s11269-015-1114-8</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Naghibi</surname>
<given-names>S. A.</given-names>
</name>
<name>
<surname>Pourghasemi</surname>
<given-names>H. R.</given-names>
</name>
<name>
<surname>Dixon</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>GIS-based Groundwater Potential Mapping Using Boosted Regression Tree, Classification and Regression Tree, and Random Forest Machine Learning Models in Iran</article-title>. <source>Environ. Monit. Assess.</source> <volume>188</volume>, <fpage>44</fpage>. <pub-id pub-id-type="doi">10.1007/s10661-015-5049-6</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ndehedehe</surname>
<given-names>C. E.</given-names>
</name>
<name>
<surname>Ferreira</surname>
<given-names>V. G.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Assessing Land Water Storage Dynamics over South America</article-title>. <source>J. Hydrol.</source> <volume>580</volume>, <fpage>124339</fpage>. <pub-id pub-id-type="doi">10.1016/j.jhydrol.2019.124339</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nolan</surname>
<given-names>B. T.</given-names>
</name>
<name>
<surname>Fienen</surname>
<given-names>M. N.</given-names>
</name>
<name>
<surname>Lorenz</surname>
<given-names>D. L.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>A Statistical Learning Framework for Groundwater Nitrate Models of the Central Valley, California, USA</article-title>. <source>J. Hydrol.</source> <volume>531</volume>, <fpage>902</fpage>&#x2013;<lpage>911</lpage>. <pub-id pub-id-type="doi">10.1016/j.jhydrol.2015.10.025</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pourghasemi</surname>
<given-names>H. R.</given-names>
</name>
<name>
<surname>Rahmati</surname>
<given-names>O.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Prediction of the Landslide Susceptibility: Which Algorithm, Which Precision?</article-title> <source>CATENA</source> <volume>162</volume>, <fpage>177</fpage>&#x2013;<lpage>192</lpage>. <pub-id pub-id-type="doi">10.1016/j.catena.2017.11.022</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rahman</surname>
<given-names>A. T. M. S.</given-names>
</name>
<name>
<surname>Hosono</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Quilty</surname>
<given-names>J. M.</given-names>
</name>
<name>
<surname>Das</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Basak</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Multiscale Groundwater Level Forecasting: Coupling New Machine Learning Approaches with Wavelet Transforms</article-title>. <source>Adv. Water Resour.</source> <volume>141</volume>, <fpage>103595</fpage>. <pub-id pub-id-type="doi">10.1016/j.advwatres.2020.103595</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Reager</surname>
<given-names>J. T.</given-names>
</name>
<name>
<surname>Thomas</surname>
<given-names>B. F.</given-names>
</name>
<name>
<surname>Famiglietti</surname>
<given-names>J. S.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>River Basin Flood Potential Inferred Using GRACE Gravity Observations at Several Months Lead Time</article-title>. <source>Nat. Geosci.</source> <volume>7</volume>, <fpage>588</fpage>&#x2013;<lpage>592</lpage>. <pub-id pub-id-type="doi">10.1038/ngeo2203</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rodell</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Famiglietti</surname>
<given-names>J. S.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Seneviratne</surname>
<given-names>S. I.</given-names>
</name>
<name>
<surname>Viterbo</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Holl</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2004a</year>). <article-title>Basin Scale Estimates of Evapotranspiration Using GRACE and Other Observations</article-title>. <source>Geophys. Res. Lett.</source> <volume>31</volume>, <fpage>L20504</fpage>. <pub-id pub-id-type="doi">10.1029/2004GL020873</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rodell</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Houser</surname>
<given-names>P. R.</given-names>
</name>
<name>
<surname>Jambor</surname>
<given-names>U.</given-names>
</name>
<name>
<surname>Gottschalck</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Mitchell</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Meng</surname>
<given-names>C.-J.</given-names>
</name>
<etal/>
</person-group> (<year>2004b</year>). <article-title>The Global Land Data Assimilation System</article-title>. <source>Bull. Amer. Meteor. Soc.</source> <volume>85</volume>, <fpage>381</fpage>&#x2013;<lpage>394</lpage>. <pub-id pub-id-type="doi">10.1175/BAMS-85-3-381</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rodell</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Velicogna</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Famiglietti</surname>
<given-names>J. S.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Satellite-based Estimates of Groundwater Depletion in India</article-title>. <source>Nature</source> <volume>460</volume>, <fpage>999</fpage>&#x2013;<lpage>1002</lpage>. <pub-id pub-id-type="doi">10.1038/nature08238</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rodell</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Famiglietti</surname>
<given-names>J. S.</given-names>
</name>
<name>
<surname>Wiese</surname>
<given-names>D. N.</given-names>
</name>
<name>
<surname>Reager</surname>
<given-names>J. T.</given-names>
</name>
<name>
<surname>Beaudoing</surname>
<given-names>H. K.</given-names>
</name>
<name>
<surname>Landerer</surname>
<given-names>F. W.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Emerging Trends in Global Freshwater Availability</article-title>. <source>Nature</source> <volume>557</volume>, <fpage>651</fpage>&#x2013;<lpage>659</lpage>. <pub-id pub-id-type="doi">10.1038/s41586-018-0123-1</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Scanlon</surname>
<given-names>B. R.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Save</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Wiese</surname>
<given-names>D. N.</given-names>
</name>
<name>
<surname>Landerer</surname>
<given-names>F. W.</given-names>
</name>
<name>
<surname>Long</surname>
<given-names>D.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Global Evaluation of New GRACE Mascon Products for Hydrologic Applications</article-title>. <source>Water Resour. Res.</source> <volume>52</volume>, <fpage>9412</fpage>&#x2013;<lpage>9429</lpage>. <pub-id pub-id-type="doi">10.1002/2016WR019494</pub-id>
</citation>
</ref>
<ref id="B47">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Schapire</surname>
<given-names>R. E.</given-names>
</name>
</person-group> (<year>2003</year>). <source>The Boosting Approach to Machine Learning: An Overview</source>. <publisher-loc>New York, NY</publisher-loc>: <publisher-name>Springer</publisher-name>, <fpage>149</fpage>&#x2013;<lpage>171</lpage>. <comment>chap. 9</comment>. <pub-id pub-id-type="doi">10.1007/978-0-387-21579-2_9</pub-id>
</citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Schneider</surname>
<given-names>U.</given-names>
</name>
<name>
<surname>Becker</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Finger</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Meyer-Christoffer</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Ziese</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Rudolf</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>GPCC&#x27;s New Land Surface Precipitation Climatology Based on Quality-Controlled <italic>In Situ</italic> Data and Its Role in Quantifying the Global Water Cycle</article-title>. <source>Theor. Appl. Climatol.</source> <volume>115</volume>, <fpage>15</fpage>&#x2013;<lpage>40</lpage>. <pub-id pub-id-type="doi">10.1007/s00704-013-0860-x</pub-id>
</citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sharafati</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Asadollah</surname>
<given-names>S. B. H. S.</given-names>
</name>
<name>
<surname>Neshat</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>A New Artificial Intelligence Strategy for Predicting the Groundwater Level over the Rafsanjan Aquifer in Iran</article-title>. <source>J. Hydrol.</source> <volume>591</volume>, <fpage>125468</fpage>. <pub-id pub-id-type="doi">10.1016/j.jhydrol.2020.125468</pub-id>
</citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Smith</surname>
<given-names>C. A.</given-names>
</name>
<name>
<surname>Sardeshmukh</surname>
<given-names>P. D.</given-names>
</name>
</person-group> (<year>2000</year>). <article-title>The Effect of ENSO on the Intraseasonal Variance of Surface Temperatures in Winter</article-title>. <source>Int. J. Climatol.</source> <volume>20</volume>, <fpage>1543</fpage>&#x2013;<lpage>1557</lpage>. <pub-id pub-id-type="doi">10.1002/1097-0088(20001115)20:13&#x3c;1543::AID-JOC579&#x3e;3.0.CO;2-A</pub-id>
</citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Pan</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Drought Evaluation Using the GRACE Terrestrial Water Storage Deficit over the Yangtze River Basin, China</article-title>. <source>Sci. Total Environ.</source> <volume>634</volume>, <fpage>727</fpage>&#x2013;<lpage>738</lpage>. <pub-id pub-id-type="doi">10.1016/j.scitotenv.2018.03.292</pub-id>
</citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Syed</surname>
<given-names>T. H.</given-names>
</name>
<name>
<surname>Famiglietti</surname>
<given-names>J. S.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Rodell</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Seneviratne</surname>
<given-names>S. I.</given-names>
</name>
<name>
<surname>Viterbo</surname>
<given-names>P.</given-names>
</name>
<etal/>
</person-group> (<year>2005</year>). <article-title>Total Basin Discharge for the Amazon and Mississippi River Basins from GRACE and a Land-Atmosphere Water Balance</article-title>. <source>Geophys. Res. Lett.</source> <volume>32</volume>, <fpage>L24404</fpage>. <pub-id pub-id-type="doi">10.1029/2005GL024851</pub-id>
</citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Velicogna</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Tong</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Kimball</surname>
<given-names>J. S.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Increasing Subsurface Water Storage in Discontinuous Permafrost Areas of the Lena River Basin, Eurasia, Detected from GRACE</article-title>. <source>Geophys. Res. Lett.</source> <volume>39</volume>, <fpage>1</fpage>&#x2013;<lpage>5</lpage>. <pub-id pub-id-type="doi">10.1029/2012GL051623</pub-id>
</citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vilar</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Woolford</surname>
<given-names>D. G.</given-names>
</name>
<name>
<surname>Martell</surname>
<given-names>D. L.</given-names>
</name>
<name>
<surname>Mart&#xed;n</surname>
<given-names>M. P.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>A Model for Predicting Human-Caused Wildfire Occurrence in the Region of Madrid, Spain</article-title>. <source>Int. J. Wildland Fire</source> <volume>19</volume>, <fpage>325</fpage>&#x2013;<lpage>337</lpage>. <pub-id pub-id-type="doi">10.1071/WF09030</pub-id>
</citation>
</ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vishwakarma</surname>
<given-names>B. D.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Monitoring Droughts from GRACE</article-title>. <source>Front. Environ. Sci.</source> <volume>8</volume>, <fpage>1</fpage>&#x2013;<lpage>6</lpage>. <pub-id pub-id-type="doi">10.3389/fenvs.2020.584690</pub-id>
</citation>
</ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Fang</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>X.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Developing a Long Short-Term Memory (LSTM)-based Model for Reconstructing Terrestrial Water Storage Variations from 1982 to 2016 in the Tarim River Basin, Northwest China</article-title>. <source>Remote Sens.</source> <volume>13</volume>, <fpage>889</fpage>&#x2013;<lpage>918</lpage>. <pub-id pub-id-type="doi">10.3390/rs13050889</pub-id>
</citation>
</ref>
<ref id="B57">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wilby</surname>
<given-names>R. L.</given-names>
</name>
<name>
<surname>Abrahart</surname>
<given-names>R. J.</given-names>
</name>
<name>
<surname>Dawson</surname>
<given-names>C. W.</given-names>
</name>
</person-group> (<year>2003</year>). <article-title>Detection of Conceptual Model Rainfall-Runoff Processes inside an Artificial Neural Network</article-title>. <source>Hydrol. Sci. J.</source> <volume>48</volume>, <fpage>163</fpage>&#x2013;<lpage>181</lpage>. <pub-id pub-id-type="doi">10.1623/hysj.48.2.163.44699</pub-id>
</citation>
</ref>
<ref id="B58">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yin</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Han</surname>
<given-names>S.-C.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Teng</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Reconstructing Terrestrial Water Storage Variations from 1980 to 2015 in the Beishan Area of China</article-title>. <source>Geofluids</source> <volume>2019</volume>, <fpage>1</fpage>&#x2013;<lpage>13</lpage>. <pub-id pub-id-type="doi">10.1155/2019/3874742</pub-id>
</citation>
</ref>
<ref id="B59">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Schneider</surname>
<given-names>U.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Becker</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Ren</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Evaluating the GPCC Full Data Daily Analysis Version 2018 through ETCCDI Indices and Comparison with Station Observations over Mainland of China</article-title>. <source>Theor. Appl. Climatol.</source> <volume>142</volume>, <fpage>835</fpage>&#x2013;<lpage>845</lpage>. <pub-id pub-id-type="doi">10.1007/s00704-020-03352-8</pub-id>
</citation>
</ref>
<ref id="B60">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zaitchik</surname>
<given-names>B. F.</given-names>
</name>
<name>
<surname>Rodell</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Reichle</surname>
<given-names>R. H.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Assimilation of GRACE Terrestrial Water Storage Data into a Land Surface Model: Results for the Mississippi River Basin</article-title>. <source>J. Hydrometeorol.</source> <volume>9</volume>, <fpage>535</fpage>&#x2013;<lpage>548</lpage>. <pub-id pub-id-type="doi">10.1175/2007JHM951.1</pub-id>
</citation>
</ref>
<ref id="B61">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Werner</surname>
<given-names>A. D.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>GRACE-based Hydrological Drought Evaluation of the Yangtze River Basin, China</article-title>. <source>J. Hydrometeorol.</source> <volume>17</volume>, <fpage>811</fpage>&#x2013;<lpage>828</lpage>. <pub-id pub-id-type="doi">10.1175/JHM-D-15-0084.1</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>