<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Mar. Sci.</journal-id>
<journal-title>Frontiers in Marine Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Mar. Sci.</abbrev-journal-title>
<issn pub-type="epub">2296-7745</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fmars.2023.1295874</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Marine Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>A method for estimating particulate organic carbon at the sea surface based on geodetector and machine learning</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Wu</surname>
<given-names>Huisheng</given-names>
</name>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Cui</surname>
<given-names>Long</given-names>
</name>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2508599"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wang</surname>
<given-names>Lejie</given-names>
</name>
<role content-type="https://credit.niso.org/contributor-roles/resources/"/>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Sun</surname>
<given-names>Ruixue</given-names>
</name>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zheng</surname>
<given-names>Zhi</given-names>
</name>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<institution>College of Oceanography and Space Informatics, China University of Petroleum (East China)</institution>, <addr-line>Qingdao, Shandong</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Haiyong Zheng, Ocean University of China, China</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Qibin Lao, Guangdong Ocean University, China</p>
<p>Hui Zheng, Henan University, China</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Long Cui, <email xlink:href="mailto:z22160008@s.upc.edu.cn">z22160008@s.upc.edu.cn</email>
</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>28</day>
<month>12</month>
<year>2023</year>
</pub-date>
<pub-date pub-type="collection">
<year>2023</year>
</pub-date>
<volume>10</volume>
<elocation-id>1295874</elocation-id>
<history>
<date date-type="received">
<day>17</day>
<month>09</month>
<year>2023</year>
</date>
<date date-type="accepted">
<day>11</day>
<month>12</month>
<year>2023</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2023 Wu, Cui, Wang, Sun and Zheng</copyright-statement>
<copyright-year>2023</copyright-year>
<copyright-holder>Wu, Cui, Wang, Sun and Zheng</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>Particulate organic carbon (POC) is an essential component of the carbon pump within marine organisms. Exploring estimation methods for POC holds substantial significance for understanding the marine carbon cycle. In this study, we investigated the spatial heterogeneity of 30 factors and POC concentrations using geodetector to account for nonlinearity, diversity, and complexity. Ultimately, 20 factors including sea surface temperature, sea surface salinity, and chlorophyll-a were selected as modeling variables. Six machine learning models&#x2014;backpropagation neural network, convolutional neural network, attention-based neural network, random forest (RF), adaptive boosting, and extreme gradient boosting&#x2014;were trained, and their performance was compared. The results indicate that among the six machine learning algorithms, RF exhibits the strongest performance, with a root mean square error of 0.11 [log(mg/m<sup>3</sup>)] and an average percentage deviation of 2.73%. Global annual average sea surface POC concentrations were estimated for 2007 and compared to NASA&#x2019;s POC product. The outcomes indicate that the RF model-based estimation method displays enhanced accuracy in estimating POC concentrations within intricate coastal environments, while the backpropagation neural network performed better in estimating POC concentrations in open ocean areas. Leveraging the RF model, global sea surface POC concentrations were estimated for the years 2007 through 2016, enabling a spatiotemporal analysis. The analysis unveils heightened POC concentrations in coastal regions and lower levels in open ocean areas. Furthermore, POC concentrations were greater in high-latitude regions compared to mid and low latitude counterparts. In conclusion, the global sea surface POC product in this study exhibits heightened spatial resolution and improved data completeness in contrast to other products. 
It enhances the accuracy of conventional POC estimation methods, particularly within coastal regions.</p>
</abstract>
<kwd-group>
<kwd>particulate organic carbon</kwd>
<kwd>machine learning</kwd>
<kwd>geodetector</kwd>
<kwd>ocean remote sensing</kwd>
<kwd>random forest</kwd>
</kwd-group>
<counts>
<fig-count count="12"/>
<table-count count="3"/>
<equation-count count="6"/>
<ref-count count="69"/>
<page-count count="17"/>
<word-count count="8361"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>Ocean Observation</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>Marine particulate organic carbon (POC) refers to the organic particles in the ocean that are generated through the metabolic processes of marine organisms, resuspension of sediments, and input from land sources. These particles include phytoplankton cells, bacteria, and organic debris, among other substances (<xref ref-type="bibr" rid="B7">Brewin et&#xa0;al., 2021</xref>). POC accounts for approximately 10% of ocean organic carbon reservoirs (<xref ref-type="bibr" rid="B19">Jahnke and Richard, 1996</xref>; <xref ref-type="bibr" rid="B33">Loisel et&#xa0;al., 2002</xref>). Although POC accounts for a small proportion of the open ocean, it is an essential component of biological pumps with a high carbon turnover rate and significant carbon flux (<xref ref-type="bibr" rid="B43">Sarmiento, 2006</xref>; <xref ref-type="bibr" rid="B21">Kim et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B24">Lao et&#xa0;al., 2023a</xref>). Therefore, analyzing spatiotemporal variations in the stock and flux of POC in the ocean is of great significance for studying the marine carbon cycle. Remote sensing data offer significant advantages in terms of temporal and spatial resolution (<xref ref-type="bibr" rid="B47">Sawaya et&#xa0;al., 2003</xref>; <xref ref-type="bibr" rid="B11">Devi et&#xa0;al., 2015</xref>). By utilizing remote sensing techniques, it is possible to provide additional methods for estimating the POC stock in the ocean (<xref ref-type="bibr" rid="B55">Stramski et&#xa0;al., 1999</xref>). POC does not possess optical activity, making it challenging to directly retrieve POC information from remote sensing signals (<xref ref-type="bibr" rid="B60">Wang et&#xa0;al., 2017</xref>). 
Researchers, both domestically and internationally, have conducted a series of studies on the factors influencing POC and found correlations between POC and inherent optical properties (IOPs), apparent optical properties (AOPs), and water constituents (<xref ref-type="bibr" rid="B55">Stramski et&#xa0;al., 1999</xref>; <xref ref-type="bibr" rid="B54">Stramski et&#xa0;al., 2008</xref>). Based on these findings, scientists proposed a range of POC retrieval algorithms.</p>
<p>
<xref ref-type="bibr" rid="B55">Stramski et&#xa0;al. (1999)</xref> were the first to estimate the distribution of POC using the IOPs of water. Based on measured POC data, they established an empirical relationship between POC and the particle backscattering coefficient (bbp). This relationship was then used to quantitatively estimate POC concentrations in the Southern Ocean (<xref ref-type="bibr" rid="B55">Stramski et&#xa0;al., 1999</xref>). <xref ref-type="bibr" rid="B32">Loisel et&#xa0;al. (2001)</xref> discovered a near-linear relationship between POC and bbp in the Southern Ocean. Based on this relationship, they derived the global spatial distribution and seasonal variations of POC using bbp (<xref ref-type="bibr" rid="B32">Loisel et&#xa0;al., 2001</xref>). According to the measured POC data, <xref ref-type="bibr" rid="B16">Gardner et&#xa0;al. (2006)</xref> established an empirical relationship between the particle attenuation coefficient (cp) and POC. Using this relationship, they developed a Two-Step algorithm (<xref ref-type="bibr" rid="B16">Gardner et&#xa0;al., 2006</xref>). However, accurately deducing IOPs from AOPs is crucial for a POC retrieval model based on IOPs (<xref ref-type="bibr" rid="B20">Jiang et&#xa0;al., 2015</xref>; <xref ref-type="bibr" rid="B18">Hayley et&#xa0;al., 2017</xref>; <xref ref-type="bibr" rid="B31">Liu et&#xa0;al., 2021</xref>).</p>
<p>In addition, some algorithms directly estimate POC based on AOPs. For instance, <xref ref-type="bibr" rid="B54">Stramski et&#xa0;al. (2008)</xref> proposed a blue-to-green band ratio algorithm based on the relationship between POC concentrations and remote sensing reflectance (Rrs) in the blue and green bands (<xref ref-type="bibr" rid="B54">Stramski et&#xa0;al., 2008</xref>). Currently, the NASA standard POC algorithm belongs to this category. <xref ref-type="bibr" rid="B41">O'Reilly and Werdell (2019)</xref> proposed a maximum band ratio-OCx (MBR-OCx) algorithm for chlorophyll estimation. <xref ref-type="bibr" rid="B53">Stramski et&#xa0;al. (2022)</xref> tested the performance of the Maximum Band Ratio for POC estimation (<xref ref-type="bibr" rid="B40">O'Reilly, 2000</xref>; <xref ref-type="bibr" rid="B41">O'Reilly and Werdell, 2019</xref>; <xref ref-type="bibr" rid="B53">Stramski et&#xa0;al., 2022</xref>). <xref ref-type="bibr" rid="B28">Le et&#xa0;al. (2017)</xref> established a POC estimation method using a color index (CI) based on satellite Rrs data and matched POC measurements (<xref ref-type="bibr" rid="B28">Le et&#xa0;al., 2017</xref>). <xref ref-type="bibr" rid="B50">Son et&#xa0;al. (2009)</xref> proposed the estimation of POC using the normalized difference carbon index (NDCI) inspired by the normalized difference vegetation index. The results showed high accuracy (R<sup>2</sup> = 0.97, N=58). Furthermore, <xref ref-type="bibr" rid="B50">Son et&#xa0;al. (2009)</xref> introduced the maximum normalized difference carbon index (MNDCI) based on the NDCI, demonstrating even higher accuracy than the previous NDCI (<xref ref-type="bibr" rid="B50">Son et&#xa0;al., 2009</xref>; <xref ref-type="bibr" rid="B60">Wang et&#xa0;al., 2017</xref>). The algorithms mentioned above are suitable for open-ocean Type I waters, whereas the others are more suitable for coastal Type II waters (<xref ref-type="bibr" rid="B39">Morel and Prieur, 1977</xref>). 
Several scholars have comprehensively tested the algorithms above and developed a series of hybrid algorithms. <xref ref-type="bibr" rid="B53">Stramski et&#xa0;al. (2022)</xref> combined the band ratio difference index (BRDI) algorithm with the MBR-OC4 algorithm based on POC concentration. The final hybrid algorithm achieved good accuracy in both Type I and Type II waters, significantly improving the universality of POC estimation algorithms. <xref ref-type="bibr" rid="B8">Cai et&#xa0;al. (2022)</xref> developed a hybrid algorithm for the East China Sea based on the CI and band ratio algorithms. Using this algorithm, they conducted a long-term time-series estimation and achieved satisfactory accuracy (<xref ref-type="bibr" rid="B8">Cai et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B53">Stramski et&#xa0;al., 2022</xref>).</p>
<p>Owing to the improved fitting capability of machine learning for nonlinear data, its application in water color remote sensing has become increasingly widespread. Scholars have already explored the use of machine learning methods for estimating POC. <xref ref-type="bibr" rid="B31">Liu et&#xa0;al. (2021)</xref> trained three machine learning models: extreme gradient boosting (XGBoost), support vector machine (SVM), and Artificial Neural Networks (ANN). They compared these models with the traditional blue-to-green band ratio algorithm for POC estimation. The results showed that the performance of the machine learning algorithms was superior to that of traditional algorithms. Additionally, machine learning algorithms better estimate the POC in marginal seas and optically complex estuarine waters (<xref ref-type="bibr" rid="B31">Liu et&#xa0;al., 2021</xref>). <xref ref-type="bibr" rid="B44">Sauz&#xe8;de et&#xa0;al. (2016)</xref> developed the &#x201c;Satellite Ocean-Color merged with Argo data to infer bio-optical properties to depth&#x201d; (SOCA) method, a neural network-based method trained using the Biogeochemical-Argo database, for estimating the vertical distribution of bbp. SOCA was improved by <xref ref-type="bibr" rid="B45">Sauz&#xe8;de et&#xa0;al. (2020)</xref>, and the new SOCA2020 model improved the accuracy of POC estimation and additionally estimated chlorophyll-a (<xref ref-type="bibr" rid="B46">Sauz&#xe8;de et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B45">Sauz&#xe8;de et&#xa0;al., 2020</xref>). However, owing to the complex optical conditions in coastal areas, the distribution of POC exhibits significant spatial heterogeneity, which results in uncertainty in POC estimation, even when using machine learning methods.</p>
<p>Geodetector is a novel statistical method for detecting spatial heterogeneity and identifying the underlying driving factors. This approach does not assume linearity and can be used to measure spatial differentiation, detect explanatory factors, or analyze the interactions between variables. It has been applied in various fields of the natural and social sciences (<xref ref-type="bibr" rid="B61">Wang and Xu, 2017</xref>). In this study, to improve the performance of machine learning in estimating the global ocean POC, geodetector was used to detect the spatial correlation between POC and 30 factors. Six machine learning models were trained: backpropagation neural network (BPNN), convolutional neural network (CNN), attention-based neural network (ABNN), random forest (RF), adaptive boosting (AdaBoost), and extreme gradient boosting (XGBoost). The performances of these models were compared and evaluated. This study estimated the annual average surface POC concentration globally from 2007 to 2017 and compared it with NASA&#x2019;s POC product. This study contributes to the development of global high-precision POC products by addressing the uncertainty caused by the significant spatial heterogeneity of POC in coastal areas.</p>
</sec>
<sec id="s2" sec-type="materials|methods">
<label>2</label>
<title>Materials and methods</title>
<sec id="s2_1">
<label>2.1</label>
<title>
<italic>In situ</italic> data</title>
<p>This study utilized data from three publicly available datasets: 1) The NASA Bio-Optical Marine Algorithm Dataset, which is a global, high-quality dataset for <italic>in situ</italic> bio-optical measurements; it is used to develop ocean color algorithms and validate satellite products (<xref ref-type="bibr" rid="B62">Werdell and Bailey, 2005</xref>). 2) The SeaWiFS Bio-optical Archive and Storage System (SeaBASS) website (<ext-link ext-link-type="uri" xlink:href="https://seabass.gsfc.nasa.gov/">https://seabass.gsfc.nasa.gov/</ext-link>) provides access to the <italic>in situ</italic> POC measurement data. SeaBASS is an oceanic and atmospheric measurement database maintained by the NASA Ocean Biology Processing Group; it collects <italic>in situ</italic> measurement data from various global cruise missions and observation sites (<xref ref-type="bibr" rid="B62">Werdell and Bailey, 2005</xref>). 3) <xref ref-type="bibr" rid="B35">Martiny et&#xa0;al. (2014)</xref> collected 60,811 <italic>in situ</italic> data points from 70 global cruise missions (<xref ref-type="bibr" rid="B35">Martiny et&#xa0;al., 2014</xref>). To establish a global surface POC estimation model in this study, the downloaded POC data were standardized, and data at depths of less than 20 m were retained as shallow surface POC concentrations. In cases where multiple measurements were available for the same spatiotemporal coordinates, the average value was considered the measured POC value for that particular point. In total, 21,955 surface POC data points were obtained.</p>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>Matching of satellite and reanalysis data with <italic>in situ</italic> data</title>
<p>Moderate Resolution Imaging Spectroradiometer (MODIS) data were downloaded from the NASA OCEAN COLOR website (<ext-link ext-link-type="uri" xlink:href="https://oceancolor.gsfc.nasa.gov/">https://oceancolor.gsfc.nasa.gov/</ext-link>), and remote sensing reanalysis data from multiple databases were downloaded from the Copernicus Marine Service (<ext-link ext-link-type="uri" xlink:href="https://marine.copernicus.eu/">https://marine.copernicus.eu/</ext-link>) (<xref ref-type="bibr" rid="B27">Lavergne et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B38">Merchant et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B17">Good et&#xa0;al., 2020</xref>). The statistical information on the remote sensing and reanalysis data is presented in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S1</bold>
</xref>. According to the time span of the collected <italic>in situ</italic> POC measurement data, remote sensing and reanalysis data covering 2007 to 2017 were used. The temporal resolution was standardized at monthly intervals. The ArcGIS mapping tool was used to match the POC measurement data with satellite data using a monthly time window, which reduces the time lag in the correlation between POC and influencing factors and improves the stability of the matching results (<xref ref-type="bibr" rid="B4">Bonelli et&#xa0;al., 2022</xref>). Finally, 14,067 matched points were obtained for the 2007&#x2013;2017 period. The geographic distribution of the matching points is shown in <xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>. The maximum POC concentration observed was 4743 mg/m<sup>3</sup>, the minimum was 1.45 mg/m<sup>3</sup>, and the average was 156.59 mg/m<sup>3</sup>.</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>Geographic distribution of matching points for particulate organic carbon (POC) and remote sensing data, where the color of the point represents the magnitude of the POC concentration.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-10-1295874-g001.tif"/>
</fig>
</sec>
<sec id="s2_3">
<label>2.3</label>
<title>Dataset segmentation</title>
<p>Suspended particulate matter (SPM) refers to the solid particles suspended in water, including organic and inorganic particles. Therefore, the ratio of POC to SPM (POC/SPM) can be used to measure the contribution of organic particles to total suspended particles (<xref ref-type="bibr" rid="B54">Stramski et&#xa0;al., 2008</xref>; <xref ref-type="bibr" rid="B63">Wo&#x17a;niak et&#xa0;al., 2010</xref>; <xref ref-type="bibr" rid="B56">Tran et&#xa0;al., 2019</xref>). According to the POC/SPM ratio, waters can be classified into three types (<xref ref-type="bibr" rid="B63">Wo&#x17a;niak et&#xa0;al., 2010</xref>): if POC/SPM&lt; 0.06, the particles in the water are predominantly mineral-based; if POC/SPM &gt; 0.25, the particles in the water are predominantly organic-based; if 0.06&lt; POC/SPM&lt; 0.25, it is considered a mixed water. This study compiled the POC concentration ranges for the three types of waters in the dataset, as shown in <xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref> and illustrated in the box plot in <xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>.</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>Statistical data table of measured points for mineral, organic, and mixed water.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="center">Type</th>
<th valign="top" align="center">Mineral</th>
<th valign="top" align="center">Mixed</th>
<th valign="top" align="center">Organic</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="center">amount</td>
<td valign="top" align="center">947</td>
<td valign="top" align="center">12162</td>
<td valign="top" align="center">958</td>
</tr>
<tr>
<td valign="top" align="center">average(mg/m<sup>3</sup>)</td>
<td valign="top" align="center">31.06</td>
<td valign="top" align="center">42.14</td>
<td valign="top" align="center">296.23</td>
</tr>
<tr>
<td valign="top" align="center">median(mg/m<sup>3</sup>)</td>
<td valign="top" align="center">23.20</td>
<td valign="top" align="center">30.60</td>
<td valign="top" align="center">220.09</td>
</tr>
<tr>
<td valign="top" align="center">min(mg/m<sup>3</sup>)</td>
<td valign="top" align="center">1.46</td>
<td valign="top" align="center">22.12</td>
<td valign="top" align="center">93.51</td>
</tr>
<tr>
<td valign="top" align="center">max(mg/m<sup>3</sup>)</td>
<td valign="top" align="center">428.58</td>
<td valign="top" align="center">2207.18</td>
<td valign="top" align="center">4743.84</td>
</tr>
<tr>
<td valign="top" align="center">SD*</td>
<td valign="top" align="center">1.06</td>
<td valign="top" align="center">0.41</td>
<td valign="top" align="center">9.96</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>* SD, Standard Deviation.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>
<bold>(A)</bold> Statistics of the particulate organic carbon concentration ranges of organic water, mineral water, and mixed water in the dataset; <bold>(B)</bold> Statistics of the number of measured data belonging to the three types of waters in the training, validation, and test datasets.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-10-1295874-g002.tif"/>
</fig>
<p>As shown in <xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>, there were 947 observations of mineral water type in the dataset, with an average POC concentration of 31.06 mg/m<sup>3</sup> and a median of 23.20 mg/m<sup>3</sup>. For the mixed water type, there were 12,162 observations with an average POC concentration of 42.14 mg/m<sup>3</sup> and a median of 30.60 mg/m<sup>3</sup>. Finally, for the organic water type, there were 958 observations with an average POC concentration of 296.23 mg/m<sup>3</sup> and a median of 220.09 mg/m<sup>3</sup>. The standard error of POC for all three water types was less than 10 mg/m<sup>3</sup>, indicating a relatively concentrated distribution of data within each group. From <xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>, it is evident that there are significant differences among the three groups. Thus, using POC/SPM as a classification criterion for waters effectively represented the differences in POC concentrations within this research dataset.</p>
<p>The dataset was divided into three parts according to the water type to train and evaluate the machine learning model. Each part was further split into training, validation, and test datasets at a ratio of 6:2:2, as shown in <xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>. Each of the resulting datasets contained approximately the same proportions of the three water types, namely approximately 7% mineral, 86% mixed, and 7% organic water. This data partitioning method ensures that the POC measured data in the training, validation, and test datasets have similar distribution patterns, which can enhance the effectiveness of the subsequent machine learning model training and evaluation.</p>
</sec>
<sec id="s2_4">
<label>2.4</label>
<title>Feature selection method</title>
<p>The objective of feature selection is to find the features most relevant to the target variable while excluding those that do not contribute to the model&#x2019;s performance. This is an important step in machine learning that helps reduce data redundancy and noise and improves the model&#x2019;s generalization and interpretability (<xref ref-type="bibr" rid="B31">Liu et&#xa0;al., 2021</xref>). Geodetector was employed to select features for the model. Its theoretical foundation is spatial autocorrelation, which breaks the assumption of independent and identically distributed data in classical statistics (<xref ref-type="bibr" rid="B14">Elhorst, 2010</xref>). The core idea is that if an independent variable significantly influences a dependent variable, the spatial distribution of the independent variable should be similar to that of the dependent variable (<xref ref-type="bibr" rid="B58">Wang and Hu, 2012</xref>). Geodetector is adept at analyzing categorical variables; ordinal, ratio, or interval variables can also be analyzed with geodetector after appropriate discretization (<xref ref-type="bibr" rid="B9">Cao et&#xa0;al., 2013</xref>). Geodetector consists of four detectors; in factor detection, the q-value represents the extent to which a factor explains the spatial variation in POC. The formula is given in <xref ref-type="disp-formula" rid="eq1">Equation 1</xref>:</p>
<disp-formula id="eq1">
<label>(1)</label>
<mml:math display="block" id="M1">
<mml:mrow>
<mml:mtext>q</mml:mtext>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>-</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mtext>WSS</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mtext>TSS</mml:mtext>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>In the equation, WSS represents the within sum of squares, and TSS represents the total sum of squares. Interaction detection assesses whether the interaction between two factors increases or decreases their explanatory power for the dependent variable, or whether the effects of these factors on POC are independent of each other.</p>
<p>The spatial distribution of POC at a global scale is uneven. This study utilized geodetector analysis to identify the factors influencing POC concentration, ensuring that the spatial distribution of each factor is similar to that of POC. By validating the spatial correlation between each factor and POC, the model can better represent the spatial distribution characteristics of POC.</p>
</sec>
<sec id="s2_5">
<label>2.5</label>
<title>Machine learning methods</title>
<p>Six machine learning models were trained in this study, including the BPNN, CNN, ABNN, RF, AdaBoost, and XGBoost, to estimate POC on the ocean surface. The performance of each model was tested individually.</p>
<p>ANNs consist of a complex network structure that includes an input layer, hidden layer(s), and an output layer (<xref ref-type="bibr" rid="B37">Mcculloch and Pitts, 1990</xref>). An ANN learns and adapts to tasks through continuous training and weight adjustment (<xref ref-type="bibr" rid="B29">Lecun et&#xa0;al., 2015</xref>). Popular training algorithms for ANNs include backpropagation and gradient descent algorithms. This study&#x2019;s BPNN model consisted of one input layer, ten hidden layers, and one output layer. The first hidden layer contained 89 neurons, and the remaining hidden layers contained 52 neurons. The activation function used between the input and hidden layers and between the output and hidden layers was ReLU. The mean squared error (MSE) was used as a loss function to train the model.</p>
<p>CNN is widely used in image recognition and computer vision tasks. Compared with traditional fully connected neural networks, CNNs have the characteristics of local connectivity and weight sharing, which enable them to effectively extract spatial features from images (<xref ref-type="bibr" rid="B30">Lecun et&#xa0;al., 1998</xref>). The core components of a CNN are the convolutional and pooling layers. The CNN model used in this study consisted of a one-dimensional convolutional layer with one input channel, 16 output channels, and three convolutional kernels. It also included a fully connected layer and an output layer. The ReLU activation function was applied to the nonlinear transformations between each layer. The MSE was used as a loss function to train the model.</p>
<p>The ABNN enhances the model&#x2019;s performance for specific tasks by introducing attention mechanisms; it can automatically learn and select important features from input data and model their correlations using a special weight allocation method (<xref ref-type="bibr" rid="B66">Yang et&#xa0;al., 2019</xref>). In this study, we first used fully connected layers for the feature transformation. The softmax function was used to calculate attention weights, which were used to weigh the features. The weighted features were summed. Similarly, the ReLU activation function was used for nonlinear transformations between layers.</p>
<p>AdaBoost builds a robust classifier by combining multiple weak classifiers, such as decision stumps (decision trees with only one split node) or simple linear classifiers. One characteristic of AdaBoost is that in each training round, it assigns higher weights to samples misclassified in the previous round. This allows weak classifiers to focus on misclassified samples, improving their overall performance and robustness (<xref ref-type="bibr" rid="B15">Freund and Schapire, 1995</xref>). This study used the sklearn library for Python to build the AdaBoost model. Decision trees were used as weak regressors, and the total number of iterations in the ensemble was set to 100.</p>
<p>XGBoost is an ensemble learning method based on a gradient-boosting algorithm used to solve classification and regression problems. It is an extension of the boosting algorithm and is known for its efficiency and accuracy, making it widely applicable across various domains. In the context of quantitative water color remote sensing, XGBoost is primarily used to predict and estimate water quality parameters (<xref ref-type="bibr" rid="B22">Krishnapuram et al., 2016</xref>; <xref ref-type="bibr" rid="B36">Massari et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B69">Zou et&#xa0;al., 2021</xref>). In this study, we implemented XGBoost using the sklearn library for Python with 100 decision trees in the ensemble and a learning rate of 0.1.</p>
<p>Random Forest (RF) is also an ensemble learning algorithm that combines multiple decision trees for classification and regression. This improves the robustness and generalizability of the model by utilizing random sampling and feature selection to combine multiple decision trees (<xref ref-type="bibr" rid="B6">Breiman, 2001</xref>; <xref ref-type="bibr" rid="B57">Verde et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B49">Shi et&#xa0;al., 2019</xref>).</p>
</sec>
<sec id="s2_6">
<label>2.6</label>
<title>Statistical indicators used for model development, validation, and testing</title>
<p>The metrics used in this study to assess model performance include the coefficient of determination (R<sup>2</sup>), root mean square error (RMSE), mean absolute percentage error (MAPE), bias, and variance.</p>
<p>R<sup>2</sup> is a statistical measure used to assess the degree to which a model fits the data. It is calculated using <xref ref-type="disp-formula" rid="eq2">Equation 2</xref>:</p>
<disp-formula id="eq2">
<label>(2)</label>
<mml:math display="block" id="M2">
<mml:mrow>
<mml:msup>
<mml:mi>R</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>S</mml:mi>
<mml:mi>S</mml:mi>
<mml:mi>R</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>S</mml:mi>
<mml:mi>S</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
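<p>SSR represents the sum of squared residuals (the squared differences between the true and predicted values), and SS represents the total sum of squares (the squared differences between the true values and their mean).</p>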
<p>The RMSE is a statistical measure that assesses the error between predicted and true values in a model. It is calculated using <xref ref-type="disp-formula" rid="eq3">Equation 3</xref>:</p>
<disp-formula id="eq3">
<label>(3)</label>
<mml:math display="block" id="M3">
<mml:mrow>
<mml:mi>R</mml:mi>
<mml:mi>M</mml:mi>
<mml:mi>S</mml:mi>
<mml:mi>E</mml:mi>
<mml:mo>=</mml:mo>
<mml:msqrt>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mi>n</mml:mi>
</mml:mfrac>
<mml:mo>&#xd7;</mml:mo>
<mml:mstyle displaystyle="true">
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mi>O</mml:mi>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>d</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>P</mml:mi>
<mml:mi>O</mml:mi>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>e</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msqrt>
</mml:mrow>
</mml:math>
</disp-formula>
<p>The MAPE is a statistical measure that assesses the average relative error between a model&#x2019;s predicted and true values. It is calculated using <xref ref-type="disp-formula" rid="eq4">Equation 4</xref>:</p>
<disp-formula id="eq4">
<label>(4)</label>
<mml:math display="block" id="M4">
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mi>A</mml:mi>
<mml:mi>P</mml:mi>
<mml:mi>E</mml:mi>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mi>n</mml:mi>
</mml:mfrac>
<mml:mo>&#xd7;</mml:mo>
<mml:mstyle displaystyle="true">
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mo>|</mml:mo>
<mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mi>O</mml:mi>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>d</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>P</mml:mi>
<mml:mi>O</mml:mi>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>e</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mi>O</mml:mi>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>e</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
<mml:mo>|</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mstyle>
<mml:mo>&#xd7;</mml:mo>
<mml:mn>100</mml:mn>
</mml:mrow>
</mml:math>
</disp-formula>
<p>Bias measures the overall error direction of the model. Variance measures the sensitivity and volatility of the model to the samples. The formulas for the bias and variance are given in <xref ref-type="disp-formula" rid="eq5">Equations 5</xref> and <xref ref-type="disp-formula" rid="eq6">6</xref>:</p>
<disp-formula id="eq5">
<label>(5)</label>
<mml:math display="block" id="M5">
<mml:mrow>
<mml:mi>B</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>s</mml:mi>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mi>n</mml:mi>
</mml:mfrac>
<mml:mo>&#xd7;</mml:mo>
<mml:mstyle displaystyle="true">
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mi>O</mml:mi>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>d</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>P</mml:mi>
<mml:mi>O</mml:mi>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>e</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="eq6">
<label>(6)</label>
<mml:math display="block" id="M6">
<mml:mrow>
<mml:mi>V</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>e</mml:mi>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mi>n</mml:mi>
</mml:mfrac>
<mml:mo>&#xd7;</mml:mo>
<mml:mstyle displaystyle="true">
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mi>O</mml:mi>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>d</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>P</mml:mi>
<mml:mi>O</mml:mi>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mrow>
<mml:mi>m</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:math>
</disp-formula>
<p>In the formulas above, n represents the number of samples, POC<sub>pred</sub> represents the model&#x2019;s predicted value, POC<sub>true</sub> represents the true value, POC<sub>mean</sub> represents the mean predicted value, and &#x3a3; denotes the summation.</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<label>3</label>
<title>Results and discussion</title>
<sec id="s3_1">
<label>3.1</label>
<title>Feature selection</title>
<p>This study utilized factor and interaction detection in a geodetector to select features for pre-model training. The candidate features can be divided into three parts.</p>
<p>The first part comprises the apparent optical properties (AOPs) and their mathematical combinations. AOPs are products of the interaction between the incident light flux inside the water and the intrinsic optical properties of the water, and they vary with the distribution and intensity of the incident light field. These quantities include downward irradiance (Ed), upward irradiance (Eu), water-leaving radiance (LW), Rrs, and the diffuse attenuation coefficients of these variables (<xref ref-type="bibr" rid="B68">Zaneveld and Mobley, 1995</xref>). In this study, the diffuse attenuation coefficient (kd) at 490 nm from the MODIS sensor was collected, as well as the Rrs at wavelengths of 412 nm, 443 nm, 469 nm, 488 nm, 547 nm, 555 nm, 645 nm, and 667 nm. These wavelengths encompass the red, green, and blue light ranges. Based on the AOPs (mainly Rrs), this study derived band ratios (red-green, red-blue, and blue-green), the normalized difference carbon index (NDCI), the color index (CI), and the band ratio difference index (BRDI) as candidate features.</p>
<p>The second part consists of inherent optical properties (IOPs), which are solely related to the internal composition of water and do not vary with changing illumination conditions. IOPs are typically used to describe seawater&#x2019;s absorption and scattering processes, including the absorption, scattering, and attenuation coefficients of various components within the water (<xref ref-type="bibr" rid="B34">Maritorena et&#xa0;al., 2010</xref>). POC is an important component of organic particulate matter. Therefore, this study used the backscattering coefficient of particles (bbp) as a candidate feature.</p>
<p>The third part included other features that may be related to POC, including sea surface temperature (SST), sea surface salinity (SSS), Chlorophyll-a (CHL), suspended particulate matter (SPM) concentration, euphotic zone depth (EZD), mixed layer depth (MLD), and photosynthetically active radiation (PAR). These parameters are closely related to marine biological activity and the ocean carbon cycle. Spatial and temporal variations in temperature and salinity directly and indirectly affect marine plants&#x2019; and animals&#x2019; growth, reproduction, distribution, and ecological functions. Chlorophyll concentration is an essential indicator of plant biomass and photosynthetic activity in the ocean. SPM reflects the concentration of particulate matter in water, and the scattering and absorption effects of suspended particles on light can affect the conditions for photosynthesis and growth of marine organisms. EZD and PAR are closely associated with marine plants&#x2019; growth and photosynthetic activity. Changes in MLD can cause variations in the distribution of different nutrients, dissolved oxygen, and light, thereby affecting marine organisms&#x2019; distribution and ecological processes (<xref ref-type="bibr" rid="B5">Bopp et&#xa0;al., 2002</xref>; <xref ref-type="bibr" rid="B43">Sarmiento, 2006</xref>; <xref ref-type="bibr" rid="B13">Doney et al., 2009</xref>). These parameters were all considered candidate features for training the model in this study.</p>
<p>The geodetector analysis was performed using the GD software package developed by Song (<xref ref-type="bibr" rid="B51">Song et&#xa0;al., 2020</xref>). Because the geodetector tool only accepts discrete variables as inputs, it is necessary to discretize the continuous variables for analysis. The GD package supports data discretization. This study used four methods: equal intervals, natural breakpoints, quantiles, and geometric intervals. The selected features were then subjected to factor and interaction detection. The results of factor detection are shown in <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>, whereas the results of interaction detection are shown in <xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4</bold>
</xref>. In factor analysis, considering the important influence of bbp on POC in other scholars&#x2019; research, and the weak correlation between remote sensing reflectance in the purple band and POC (<xref ref-type="bibr" rid="B55">Stramski et&#xa0;al., 1999</xref>; <xref ref-type="bibr" rid="B56">Tran et&#xa0;al., 2019</xref>), we used a threshold of q=0.3 for bbp to determine the strength of its correlation with POC. Specifically, variables with q&lt;0.3 are considered weakly correlated with POC, while variables with q&gt;0.3 are considered strongly correlated with POC. Variables that showed nonlinear attenuation in both factor and interaction detection were excluded. NDCI and CI have two categories: one based on 443 nm and the other based on 488 nm. The factor detection results for these four features had q values greater than 0.3, indicating a significant impact on the POC. In interaction detection, there was no nonlinear or single-factor nonlinear attenuation with other factors. However, building a model using two identical factors is not meaningful. Therefore, in this study, NDCI (443) and CI (443) with lower q values were excluded from the analysis. Finally, 20 variables were selected to train the POC estimation model, and the results are listed in <xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Table S2</bold>
</xref>.</p>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>Geodetector factor detection results.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-10-1295874-g003.tif"/>
</fig>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Heat map of geodetector interaction results.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-10-1295874-g004.tif"/>
</fig>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Machine learning methods development and validation</title>
<sec id="s3_2_1">
<label>3.2.1</label>
<title>Accuracy of the model on different datasets</title>
<p>The observed dataset was divided into training, validation, and test datasets. These datasets were used for the machine learning model training, hyperparameter tuning, and model performance validation. Hyperparameter tuning was performed using Bayesian optimization, as described by Shahriari and Swersky (<xref ref-type="bibr" rid="B48">Shahriari et&#xa0;al., 2016</xref>).</p>
<p>In this study, the six trained machine learning models were divided into two categories: BPNN, CNN, and ABNN, which are artificial neural networks (ANN), whereas AdaBoost, RF, and XGBoost are ensemble algorithms. These models can achieve high accuracy in multivariate regression tasks and exhibit good fitting performance for nonlinear functions. However, the large differences in data quantities for mineral, mixed, and organic water in the dataset are unfavorable for model training. They may lead to an increase in model variance. To enhance the generalization performance of the models, we applied a logarithmic transformation with a base of 10 to both the observed and estimated POC values. <xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref> shows the accuracy of the six machine learning models in estimating the log<sub>10</sub>(POC) for the three datasets. Bold accuracy indicators represent the best performance for the corresponding dataset. Among the six models, the ensemble algorithms outperformed the neural network algorithms. The RF model achieved the best performance with an R<sup>2</sup> of 0.85, RMSE of 0.11 log<sub>10</sub>(mg/m<sup>3</sup>), MAPE of 2.73%, variance of 0.09, and bias of 0.003 on the test dataset. This indicates that the RF model for estimating POC has good fitting and generalization capabilities.</p>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>Model accuracy on training, validation, and test datasets.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" colspan="2" align="left">Dataset</th>
<th valign="middle" align="left">R<sup>2</sup>
</th>
<th valign="middle" align="left">RMSE</th>
<th valign="middle" align="left">MAPE</th>
<th valign="middle" align="left">Variance</th>
<th valign="middle" align="left">Bias</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" rowspan="6" align="center">Training</td>
<td valign="middle" align="left">BPNN</td>
<td valign="middle" align="left">
<bold>0.99</bold>
</td>
<td valign="middle" align="left">0.09</td>
<td valign="middle" align="left">2.45%</td>
<td valign="middle" align="left">0.97</td>
<td valign="middle" align="left">0.012</td>
</tr>
<tr>
<td valign="middle" align="left">CNN</td>
<td valign="middle" align="left">0.80</td>
<td valign="middle" align="left">0.13</td>
<td valign="middle" align="left">4.58%</td>
<td valign="middle" align="left">
<bold>0.09</bold>
</td>
<td valign="middle" align="left">-0.009</td>
</tr>
<tr>
<td valign="middle" align="left">ABNN</td>
<td valign="middle" align="left">0.78</td>
<td valign="middle" align="left">0.14</td>
<td valign="middle" align="left">5.67%</td>
<td valign="middle" align="left">
<bold>0.09</bold>
</td>
<td valign="middle" align="left">0.029</td>
</tr>
<tr>
<td valign="middle" align="left">AdaBoost</td>
<td valign="middle" align="left">0.78</td>
<td valign="middle" align="left">0.14</td>
<td valign="middle" align="left">5.56%</td>
<td valign="middle" align="left">
<bold>0.09</bold>
</td>
<td valign="middle" align="left">0.022</td>
</tr>
<tr>
<td valign="middle" align="left">RF</td>
<td valign="middle" align="left">0.98</td>
<td valign="middle" align="left">
<bold>0.04</bold>
</td>
<td valign="middle" align="left">
<bold>1.02%</bold>
</td>
<td valign="middle" align="left">
<bold>0.09</bold>
</td>
<td valign="middle" align="left">
<bold>0.0004</bold>
</td>
</tr>
<tr>
<td valign="middle" align="left">XGBoost</td>
<td valign="middle" align="left">0.95</td>
<td valign="middle" align="left">0.07</td>
<td valign="middle" align="left">2.73%</td>
<td valign="middle" align="left">
<bold>0.09</bold>
</td>
<td valign="middle" align="left">0.003</td>
</tr>
<tr>
<td valign="middle" rowspan="6" align="center">Validation</td>
<td valign="middle" align="left">BPNN</td>
<td valign="middle" align="left">0.82</td>
<td valign="middle" align="left">0.43</td>
<td valign="middle" align="left">3.27%</td>
<td valign="middle" align="left">0.92</td>
<td valign="middle" align="left">0.003</td>
</tr>
<tr>
<td valign="middle" align="left">CNN</td>
<td valign="middle" align="left">0.80</td>
<td valign="middle" align="left">0.13</td>
<td valign="middle" align="left">4.74%</td>
<td valign="middle" align="left">
<bold>0.09</bold>
</td>
<td valign="middle" align="left">-0.012</td>
</tr>
<tr>
<td valign="middle" align="left">ABNN</td>
<td valign="middle" align="left">0.77</td>
<td valign="middle" align="left">0.14</td>
<td valign="middle" align="left">5.67%</td>
<td valign="middle" align="left">
<bold>0.09</bold>
</td>
<td valign="middle" align="left">0.029</td>
</tr>
<tr>
<td valign="middle" align="left">AdaBoost</td>
<td valign="middle" align="left">0.76</td>
<td valign="middle" align="left">0.15</td>
<td valign="middle" align="left">5.76%</td>
<td valign="middle" align="left">
<bold>0.09</bold>
</td>
<td valign="middle" align="left">0.022</td>
</tr>
<tr>
<td valign="middle" align="left">RF</td>
<td valign="middle" align="left">
<bold>0.87</bold>
</td>
<td valign="middle" align="left">
<bold>0.11</bold>
</td>
<td valign="middle" align="left">
<bold>2.61%</bold>
</td>
<td valign="middle" align="left">
<bold>0.09</bold>
</td>
<td valign="middle" align="left">
<bold>-0.001</bold>
</td>
</tr>
<tr>
<td valign="middle" align="left">XGBoost</td>
<td valign="middle" align="left">0.86</td>
<td valign="middle" align="left">
<bold>0.11</bold>
</td>
<td valign="middle" align="left">3.29%</td>
<td valign="middle" align="left">
<bold>0.09</bold>
</td>
<td valign="middle" align="left">-0.003</td>
</tr>
<tr>
<td valign="middle" rowspan="6" align="center">Test</td>
<td valign="middle" align="left">BPNN</td>
<td valign="middle" align="left">0.79</td>
<td valign="middle" align="left">0.14</td>
<td valign="middle" align="left">3.47%</td>
<td valign="middle" align="left">
<bold>0.08</bold>
</td>
<td valign="middle" align="left">0.004</td>
</tr>
<tr>
<td valign="middle" align="left">CNN</td>
<td valign="middle" align="left">0.78</td>
<td valign="middle" align="left">0.14</td>
<td valign="middle" align="left">4.77%</td>
<td valign="middle" align="left">0.09</td>
<td valign="middle" align="left">-0.006</td>
</tr>
<tr>
<td valign="middle" align="left">ABNN</td>
<td valign="middle" align="left">0.77</td>
<td valign="middle" align="left">0.14</td>
<td valign="middle" align="left">5.53%</td>
<td valign="middle" align="left">0.09</td>
<td valign="middle" align="left">0.032</td>
</tr>
<tr>
<td valign="middle" align="left">AdaBoost</td>
<td valign="middle" align="left">0.75</td>
<td valign="middle" align="left">0.15</td>
<td valign="middle" align="left">5.83%</td>
<td valign="middle" align="left">0.09</td>
<td valign="middle" align="left">0.025</td>
</tr>
<tr>
<td valign="middle" align="left">RF</td>
<td valign="middle" align="left">
<bold>0.85</bold>
</td>
<td valign="middle" align="left">
<bold>0.11</bold>
</td>
<td valign="middle" align="left">
<bold>2.73%</bold>
</td>
<td valign="middle" align="left">0.09</td>
<td valign="middle" align="left">0.003</td>
</tr>
<tr>
<td valign="middle" align="left">XGBoost</td>
<td valign="middle" align="left">0.84</td>
<td valign="middle" align="left">0.12</td>
<td valign="middle" align="left">3.45%</td>
<td valign="middle" align="left">0.09</td>
<td valign="middle" align="left">
<bold>0.0015</bold>
</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>BPNN, Backpropagation Neural Network; CNN, Convolutional Neural Network; ABNN, Attention-Based Neural Network; RF, Random Forest; AdaBoost, Adaptive Boosting; XGBoost, eXtreme Gradient Boosting; RMSE, Root Mean Square Error; MAPE, Mean Absolute Percentage Error.</p>
</fn>
<fn>
<p>Bold values represent the best performance for the corresponding dataset.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>Normalized residuals were used to evaluate the fit of the statistical model and detect outliers. By observing the distribution of the normalized residuals, we can assess the model&#x2019;s fit and identify outliers, which can help improve the model or clean the data. The normalized residuals of the predictions made by the six models on the test dataset were calculated. <xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5</bold>
</xref> shows a scatterplot comparing the predicted and true values, where each point&#x2019;s color represents the normalized residual&#x2019;s magnitude. It can be visually observed that the BPNN performed the best among the neural network algorithms, with a MAPE of 3.471%. Among the ensemble algorithms, the RF performed the best. In contrast, the CNN, ABNN, and AdaBoost algorithms have a poorer fit than the other models, and they have many data points with larger normalized residuals at high POC concentrations. This indicates that these three models have lower accuracy in estimating high POC concentrations. The BPNN, XGBoost, and RF algorithms exhibited a better fit, and RF performed well in predicting low and high POC concentrations. This is related to the strong noise immunity of RF, which can effectively reduce the effects of randomness and noise by training multiple trees and averaging their predictions (<xref ref-type="bibr" rid="B6">Breiman, 2001</xref>), thus improving the robustness of the model and increasing the estimation accuracy of the POC.</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>Scatterplot comparing model predicted and true values, where the color of the points represents the magnitude of the normalized residuals. <bold>(A&#x2013;F)</bold> represent Backpropagation Neural Network, Convolutional Neural Network, Attention-Based Neural Network, Adaptive Boosting, Extreme Gradient Boosting and Random Forest, respectively.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-10-1295874-g005.tif"/>
</fig>
</sec>
<sec id="s3_2_2">
<label>3.2.2</label>
<title>Accuracy of the model on different waters</title>
<p>To investigate the performance of the machine learning models in estimating POC for different water types, 200 matched POC data points belonging to mineral, organic, and mixed water were randomly sampled from the observed dataset. These data points were used to predict and assess the accuracy of the six trained machine-learning models. <xref ref-type="table" rid="T3">
<bold>Table&#xa0;3</bold>
</xref> presents the performance of the models in estimating log<sub>10</sub>(POC) for the three water types. The bold indicators in the table represent the best performance of each machine learning model in estimating log<sub>10</sub>(POC) for the three water types. It can be observed that all six machine learning models performed best in estimating the POC for mixed water. The RMSE is less than 0.1 log<sub>10</sub>(mg/m<sup>3</sup>), the MAPE is less than 4%, the variance does not exceed 0.008, and the absolute value of the bias does not exceed 0.03. <xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref> illustrates the significant differences in the POC concentration distributions in mineral, mixed, and organic water. These three water types represent low, intermediate, and high POC concentrations, respectively.</p>
<table-wrap id="T3" position="float">
<label>Table&#xa0;3</label>
<caption>
<p>Model performance for particulate organic carbon estimation in mineral, mixed, and organic water.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" colspan="2" align="left">Model</th>
<th valign="middle" align="left">RMSE</th>
<th valign="middle" align="left">MAPE</th>
<th valign="middle" align="left">Bias</th>
<th valign="middle" align="left">Variance</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" rowspan="3" align="center">BPNN</td>
<td valign="middle" align="left">Mineral</td>
<td valign="middle" align="left">0.16</td>
<td valign="middle" align="left">4.78%</td>
<td valign="middle" align="left">-0.03</td>
<td valign="middle" align="left">0.02</td>
</tr>
<tr>
<td valign="middle" align="left">Mixed</td>
<td valign="middle" align="left">
<bold>0.07</bold>
</td>
<td valign="middle" align="left">
<bold>1.53%</bold>
</td>
<td valign="middle" align="left">
<bold>-0.005</bold>
</td>
<td valign="middle" align="left">
<bold>0.004</bold>
</td>
</tr>
<tr>
<td valign="middle" align="left">Organic</td>
<td valign="middle" align="left">0.19</td>
<td valign="middle" align="left">4.92%</td>
<td valign="middle" align="left">0.08</td>
<td valign="middle" align="left">0.03</td>
</tr>
<tr>
<td valign="middle" rowspan="3" align="center">CNN</td>
<td valign="middle" align="left">Mineral</td>
<td valign="middle" align="left">0.26</td>
<td valign="middle" align="left">9.91%</td>
<td valign="middle" align="left">-0.17</td>
<td valign="middle" align="left">0.04</td>
</tr>
<tr>
<td valign="middle" align="left">Mixed</td>
<td valign="middle" align="left">
<bold>0.09</bold>
</td>
<td valign="middle" align="left">
<bold>3.62%</bold>
</td>
<td valign="middle" align="left">
<bold>-0.006</bold>
</td>
<td valign="middle" align="left">
<bold>0.008</bold>
</td>
</tr>
<tr>
<td valign="middle" align="left">Organic</td>
<td valign="middle" align="left">0.31</td>
<td valign="middle" align="left">10.24%</td>
<td valign="middle" align="left">0.19</td>
<td valign="middle" align="left">0.06</td>
</tr>
<tr>
<td valign="middle" rowspan="3" align="center">ABNN</td>
<td valign="middle" align="left">Mineral</td>
<td valign="middle" align="left">0.27</td>
<td valign="middle" align="left">11.3%</td>
<td valign="middle" align="left">-0.19</td>
<td valign="middle" align="left">0.04</td>
</tr>
<tr>
<td valign="middle" align="left">Mixed</td>
<td valign="middle" align="left">
<bold>0.09</bold>
</td>
<td valign="middle" align="left">
<bold>3.98%</bold>
</td>
<td valign="middle" align="left">
<bold>-0.03</bold>
</td>
<td valign="middle" align="left">
<bold>0.007</bold>
</td>
</tr>
<tr>
<td valign="middle" align="left">Organic</td>
<td valign="middle" align="left">0.32</td>
<td valign="middle" align="left">11.14%</td>
<td valign="middle" align="left">0.22</td>
<td valign="middle" align="left">0.06</td>
</tr>
<tr>
<td valign="middle" rowspan="3" align="center">AdaBoost</td>
<td valign="middle" align="left">Mineral</td>
<td valign="middle" align="left">0.25</td>
<td valign="middle" align="left">11.33%</td>
<td valign="middle" align="left">-0.18</td>
<td valign="middle" align="left">0.03</td>
</tr>
<tr>
<td valign="middle" align="left">Mixed</td>
<td valign="middle" align="left">
<bold>0.08</bold>
</td>
<td valign="middle" align="left">
<bold>3.83%</bold>
</td>
<td valign="middle" align="left">
<bold>-0.03</bold>
</td>
<td valign="middle" align="left">
<bold>0.006</bold>
</td>
</tr>
<tr>
<td valign="middle" align="left">Organic</td>
<td valign="middle" align="left">0.34</td>
<td valign="middle" align="left">13.72%</td>
<td valign="middle" align="left">0.28</td>
<td valign="middle" align="left">0.036</td>
</tr>
<tr>
<td valign="middle" rowspan="3" align="center">RF</td>
<td valign="middle" align="left">Mineral</td>
<td valign="middle" align="left">0.16</td>
<td valign="middle" align="left">6.19%</td>
<td valign="middle" align="left">0.06</td>
<td valign="middle" align="left">0.02</td>
</tr>
<tr>
<td valign="middle" align="left">Mixed</td>
<td valign="middle" align="left">
<bold>0.05</bold>
</td>
<td valign="middle" align="left">
<bold>1.06%</bold>
</td>
<td valign="middle" align="left">
<bold>0.006</bold>
</td>
<td valign="middle" align="left">
<bold>0.002</bold>
</td>
</tr>
<tr>
<td valign="middle" align="left">Organic</td>
<td valign="middle" align="left">0.09</td>
<td valign="middle" align="left">4.67%</td>
<td valign="middle" align="left">-0.11</td>
<td valign="middle" align="left">0.03</td>
</tr>
<tr>
<td valign="middle" rowspan="3" align="center">XGBoost</td>
<td valign="middle" align="left">Mineral</td>
<td valign="middle" align="left">0.17</td>
<td valign="middle" align="left">5.80%</td>
<td valign="middle" align="left">-0.08</td>
<td valign="middle" align="left">0.02</td>
</tr>
<tr>
<td valign="middle" align="left">Mixed</td>
<td valign="middle" align="left">
<bold>0.04</bold>
</td>
<td valign="middle" align="left">
<bold>1.76%</bold>
</td>
<td valign="middle" align="left">
<bold>-0.002</bold>
</td>
<td valign="middle" align="left">
<bold>0.002</bold>
</td>
</tr>
<tr>
<td valign="middle" align="left">Organic</td>
<td valign="middle" align="left">0.22</td>
<td valign="middle" align="left">6.70%</td>
<td valign="middle" align="left">0.13</td>
<td valign="middle" align="left">0.03</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>BPNN, Backpropagation Neural Network; CNN, Convolutional Neural Network; ABNN, Attention-Based Neural Network; RF, Random Forest; AdaBoost, Adaptive Boosting; XGBoost, eXtreme Gradient Boosting; RMSE, Root Mean Square Error; MAPE, Mean Absolute Percentage Error.</p>
</fn>
<fn>
<p>The bold indicators in the table represent the best performance of each machine learning model in estimating log10(POC) for the three water types.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>As shown in <xref ref-type="table" rid="T3">
<bold>Table&#xa0;3</bold>
</xref>, except for the RF algorithm, the other five machine learning algorithms had higher prediction accuracies for mineral water than organic water, indicating that these five algorithms performed better in estimating low POC values. The RF algorithm had better estimation accuracy for organic water than mineral water, indicating that the RF model can better estimate high POC concentrations. <xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref> normalizes the RMSE, MAPE, variance, and bias metrics, allowing for a visual comparison of the performance of each model for the three water types. The BPNN performed the best in mineral water, RF performed the best in mixed water, and RF demonstrated a significantly higher accuracy in estimating organic water than the other models. In contrast, CNN, ABNN, and AdaBoost performed relatively poorly for all three water types.</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>Radar plots of the performance of machine learning models for estimating particulate organic carbon in: <bold>(A)</bold> mineral water; <bold>(B)</bold> mixed water; <bold>(C)</bold> organic water.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-10-1295874-g006.tif"/>
</fig>
<p>In summary, the six machine learning models had good estimation performances for the moderate POC concentration range represented by mixed water (30 mg/m<sup>3</sup>&#x2013;100 mg/m<sup>3</sup>). The BPNN achieved higher estimation accuracy for low POC concentrations represented by mineral water (10 mg/m<sup>3</sup>&#x2013;30 mg/m<sup>3</sup>). In comparison, RF performed better in estimating high POC concentrations represented by organic water (&gt;100 mg/m<sup>3</sup>).</p>
</sec>
</sec>
<sec id="s3_3">
<label>3.3</label>
<title>Model application</title>
<sec id="s3_3_1">
<label>3.3.1</label>
<title>Comparison with NASA&#x2019;s POC products in space and time</title>
<p>This study compared the global POC products estimated using the RF, BPNN, and band-ratio algorithms in terms of their spatial and temporal distributions. The National Aeronautics and Space Administration (NASA) has utilized the blue-to-green band ratio algorithm to estimate POC concentrations in global oceans. This algorithm used the ratio of Rrs(443 nm) to Rrs(555 nm) from MODIS (<xref ref-type="bibr" rid="B54">Stramski et&#xa0;al., 2008</xref>). This study obtained NASA global POC products from the NASA Ocean Color website, spanning 2007 to 2017, for spatial and temporal analyses. Products from 2007 to 2016 were used for interannual POC variation analysis, whereas products from 2017 were used for spatial distribution analysis.</p>
<p>
<xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7</bold>
</xref> shows the spatial distribution of the global POC concentrations estimated using the RF, BPNN, and NASA standard POC product for 2017. <xref ref-type="fig" rid="f7">
<bold>Figure&#xa0;7</bold>
</xref> shows that the spatial distributions of POC concentrations estimated by the three algorithms were similar worldwide. In global oceans, POC concentrations are mostly below 100 mg/m<sup>3</sup> in the Atlantic, Pacific and Indian Oceans, but above 100 mg/m<sup>3</sup> in the Arctic Ocean. Additionally, POC concentrations in coastal waters were significantly higher than in open ocean waters, because of the abundant land-based input of nutrients to coastal waters, and the intense water mass movements that cause bottom nutrients to be transported to the surface layer, which promotes phytoplankton growth and increases the efficiency of POC production (<xref ref-type="bibr" rid="B25">Lao et&#xa0;al., 2023b</xref>).</p>
<fig id="f7" position="float">
<label>Figure&#xa0;7</label>
<caption>
<p>The global POC concentration distribution in 2017, estimated using three algorithms: <bold>(A)</bold> band ratio, <bold>(B)</bold> backpropagation neural network, and <bold>(C)</bold> random forest.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-10-1295874-g007.tif"/>
</fig>
<p>
<xref ref-type="fig" rid="f8">
<bold>Figure&#xa0;8</bold>
</xref> presents the deviation and percentage deviation of the global POC concentrations estimated by the RF and BPNN compared to the NASA standard POC product. In the Arctic Ocean, the BPNN estimated significantly higher POC concentrations than the NASA standard POC product, with deviations exceeding 75 mg/m<sup>3</sup> and percentage deviations exceeding 50%. However, the RF algorithm showed little deviation from the NASA standard POC product in the Arctic Ocean, with some regions showing lower POC concentrations of more than 50 mg/m<sup>3</sup> and a percentage deviation exceeding 30%. In the Pacific, Atlantic, and Indian Oceans, the RF algorithm showed minimal deviation from the NASA standard POC product, with the Atlantic region having slightly lower POC concentrations and the Pacific and Indian Oceans having slightly higher POC concentrations. The deviation was less than 15 mg/m<sup>3</sup>, and the percentage deviation was less than 40%. In contrast, the BPNN exhibited lower POC concentrations than the NASA standard POC product in the central Atlantic, central Pacific, and northern Indian Oceans. Although the deviation was within 25 mg/m<sup>3</sup>, the percentage deviation exceeded 50%, indicating that the BPNN can improve the estimation of POC concentrations in part of the open ocean. In the Antarctic Ocean, the RF algorithm and the BPNN estimated higher POC concentrations than the NASA standard POC product, with a deviation exceeding 50 mg/m<sup>3</sup> and, in some regions, even exceeding 100 mg/m<sup>3</sup>, with a percentage deviation exceeding 50%. The NASA reference product uses the blue-green band ratio algorithm, which only considers Rrs and cannot effectively represent the influence of water components such as chlorophyll on POC.
In polar oceans, the melting of glaciers increases the input of nutrient-rich water, promoting the growth of surface phytoplankton, leading to significantly higher chlorophyll-a concentrations compared to low-latitude seas (<xref ref-type="bibr" rid="B2">Babin et&#xa0;al., 2003</xref>; <xref ref-type="bibr" rid="B1">Arrigo, 2005</xref>; <xref ref-type="bibr" rid="B52">Steinacher et&#xa0;al., 2008</xref>). The RF and BPNN estimation models utilize Chl-a, which can effectively reflect the relationship between Chl-a and POC. Therefore, it is reasonable for RF and BPNN to exhibit certain differences from the NASA reference product in polar oceans. Moreover, in the Persian Gulf, Red Sea, and Arabian Sea, the RF algorithm showed significantly higher results than the reference products, with a deviation exceeding 100 mg/m<sup>3</sup> and a percentage deviation exceeding 50%. These waters are strongly influenced by the monsoon winds of the Indian Ocean, which cause upwelling of deep water to the sea surface, promoting the mixing and transport of nutrients. Additionally, certain areas may also be affected by nutrient-rich water inputs from the Red Sea and the Persian Gulf, leading to possible occurrences of eutrophication in some sea areas (<xref ref-type="bibr" rid="B23">Kumar et&#xa0;al., 2000</xref>). The abundant nutrients facilitate the growth of phytoplankton in these waters, further promoting the production of POC and resulting in elevated POC concentrations.</p>
<fig id="f8" position="float">
<label>Figure&#xa0;8</label>
<caption>
<p>Deviation and percentage deviation between the 2017 global POC concentration estimated by random forest and backpropagation neural network algorithms and NASA&#x2019;s particulate organic carbon standard algorithm. <bold>(A)</bold> Deviation of the back propagation neural network from the NASA standard algorithm for estimating POC. <bold>(B)</bold> Percentage deviation of the back propagation neural network from the NASA standard algorithm for estimating POC. <bold>(C)</bold> Deviation of the random forest from the NASA standard algorithm for estimating POC. <bold>(D)</bold> Percentage deviation of the random forest from the NASA standard algorithm for estimating POC.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-10-1295874-g008.tif"/>
</fig>
<p>Overall, the BPNN performed better than the RF algorithm in estimating open ocean POC concentrations. The RF algorithm showed a minor difference from the NASA standard POC product in the open ocean regions, with a percentage deviation of approximately 20%. However, in some coastal areas, the RF algorithm estimates higher POC concentrations than the NASA standard POC product, which helps improve the underestimation of POC concentrations by the band ratio algorithm in coastal waters.</p>
<p>
<xref ref-type="fig" rid="f9">
<bold>Figure&#xa0;9</bold>
</xref> shows the annual average variations in global POC concentrations estimated by the NASA standard POC product, the random forest (RF) algorithm, and the BPNN between 2007 and 2016. The annual average values estimated by the NASA standard POC product range from 85 mg/m<sup>3</sup> to 100 mg/m<sup>3</sup>. In contrast, the annual average POC concentrations estimated using the BPNN and RF algorithm ranged from 60 mg/m<sup>3</sup> to 70 mg/m<sup>3</sup>. The average percentage deviation of the BPNN from the NASA standard POC product is 27.15%. In comparison, the RF algorithm has an average deviation of 25.33% from the NASA standard POC product. This deviation can be attributed to two factors.</p>
<fig id="f9" position="float">
<label>Figure&#xa0;9</label>
<caption>
<p>Annual changes in global POC from 2007 to 2016 as estimated by the blue-to-green band ratio, backpropagation neural network, and random forest algorithm.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-10-1295874-g009.tif"/>
</fig>
<p>First, the NASA global standard POC product includes estimates of POC concentrations in inland waters. Although inland waters have smaller surface areas than oceans, they may have higher POC contents. This is because inland waters are usually shallower, making it easier for light to penetrate to the bottom of the water. This promotes active photosynthesis and higher biological productivity. At the same time, inland waters are influenced by input substances, organisms, and human activities from land, such as organic matter, nutrients, and pollutants carried by rivers, which may result in relatively higher POC content (<xref ref-type="bibr" rid="B67">Yang et&#xa0;al., 2016</xref>). This affected the average value of the NASA global POC product to some extent. Second, POC concentrations can exceed 10,000 mg/m<sup>3</sup> (<xref ref-type="bibr" rid="B52">Steinacher et&#xa0;al., 2008</xref>). The measured POC values collected in this study range from 1.46 mg/m<sup>3</sup> to 4743 mg/m<sup>3</sup>, and there are relatively few measured points with high POC concentrations. This caused the trained model to underestimate the values of high POC concentrations. Combining these two factors, the global average annual POC value estimated by the machine learning models is lower than the average annual POC value in NASA&#x2019;s standard POC product.</p>
<p>
<xref ref-type="fig" rid="f9">
<bold>Figure&#xa0;9</bold>
</xref> shows that, from 2007 to 2011, the global mean POC estimated by the RF algorithm and the NASA standard product increased. From 2011 to 2014, there was a slight decrease in global mean POC; from 2014 to 2016, there was a subsequent increase. In contrast, the BPNN estimated an increase in global POC from 2007 to 2009, a decrease from 2009 to 2013, and an increase from 2013 to 2016. Regarding the annual trends, the RF estimation of the global mean POC showed better consistency with the NASA standard product than the BPNN estimation did, and the RF-estimated POC product can be used to investigate the spatial and temporal trends in POC in various global ocean areas.</p>
</sec>
<sec id="s3_3_2" sec-type="results">
<label>3.3.2</label>
<title>Results of the random forest algorithm for estimating global surface POC</title>
<p>The BPNN and random forest algorithm performed well in estimating global surface POC concentrations. However, the Random Forest algorithm provides a better estimate of POC in coastal waters. This study estimated the global surface POC concentration from 2007 to 2016 using the random forest algorithm and discussed the variations in POC in different ocean regions during this period.</p>
<p>
<xref ref-type="fig" rid="f10">
<bold>Figure&#xa0;10</bold>
</xref> illustrates the distribution of global surface POC concentrations from 2007 to 2016, which indicates a consistent spatial distribution of POC over the 10-year period. The global biomass of zooplankton is higher in the coastal zone than in the open ocean due to sufficient land inputs, abundant sunlight and nutrient-rich currents. The distribution of surface POC is higher in the coastal zone than in the open ocean. <xref ref-type="fig" rid="f10">
<bold>Figure&#xa0;10</bold>
</xref> shows that surface POC concentrations are significantly higher in nearshore areas (e.g., the Arabian Sea, off China and off Angola) than in other areas. Indeed, the distribution of surface POC concentrations is also related to latitude. <xref ref-type="fig" rid="f10">
<bold>Figure&#xa0;10</bold>
</xref> shows that high-latitude regions, such as the Arctic Ocean, Antarctic waters, North and South Atlantic, and North and South Pacific, have higher surface POC concentrations than middle and low-latitude regions. This was related to several factors.</p>
<fig id="f10" position="float">
<label>Figure&#xa0;10</label>
<caption>
<p>
<bold>(A&#x2013;J)</bold> Represent global particulate organic carbon distribution from 2007 to 2016 estimated using the random forest algorithm.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-10-1295874-g010.tif"/>
</fig>
<p>First, nutrients provided by water transport have a significant impact on the growth of phytoplankton (<xref ref-type="bibr" rid="B42">Sardessai et&#xa0;al., 2010</xref>; <xref ref-type="bibr" rid="B64">Xu et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B25">Lao et&#xa0;al., 2023b</xref>), including enhanced vertical mixing (<xref ref-type="bibr" rid="B26">Lao et&#xa0;al., 2023c</xref>), which directly affects the distribution of organic matter content in the ocean (<xref ref-type="bibr" rid="B65">Yamashita et&#xa0;al., 2019</xref>; <xref ref-type="bibr" rid="B59">Wang et&#xa0;al., 2021</xref>).</p>
<p>Water masses are more strongly mixed at high latitudes due to cold water, glacial melt, polar eddies, and boundary currents, and these fluid movements bring deep organic matter (e.g., dead organisms and detritus) to the surface of the oceans, which increases the organic content of the surface layer, enhances the productivity of marine organisms, and increases the production of POC. Secondly, high latitudes have relatively weak sunlight, especially in winter. This limits the photosynthesis of phytoplankton. As a result, they focus on growth and reproduction during the shorter summer months, leading to higher surface POC concentrations (<xref ref-type="bibr" rid="B2">Babin et&#xa0;al., 2003</xref>; <xref ref-type="bibr" rid="B1">Arrigo, 2005</xref>; <xref ref-type="bibr" rid="B52">Steinacher et&#xa0;al., 2008</xref>).</p>
<p>
<xref ref-type="fig" rid="f11">
<bold>Figure&#xa0;11</bold>
</xref> shows the results of classifying the POC products estimated using RF into mineral water, mixed water and organic water for the period 2007-2016. Mineral water is mainly found in the Arctic Ocean, Antarctic waters, and regions between 20&#xb0; and 40&#xb0; north and south latitudes. Mixed water is predominantly found in equatorial regions and the North and South Atlantic and Pacific waters. Organic water was distributed along the continental margins. Although the POC concentration is higher in the Arctic Ocean, intense ocean currents and glacial melting in polar regions result in higher concentrations of suspended particles. This classification implies that the Arctic Ocean region falls under the mineral water category.</p>
<fig id="f11" position="float">
<label>Figure&#xa0;11</label>
<caption>
<p>Distribution of mineral, mixed, and organic water according to particulate organic carbon/suspended particulate matter.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-10-1295874-g011.tif"/>
</fig>
<p>Fifty sampling points were selected from the three waters mentioned above. POC concentrations at the sampling points collected between 2007 and 2016 were extracted. The average value of these 50 concentrations represented the average POC concentration of the corresponding waters in the current year. A line graph was plotted to examine the variations in POC concentrations over time in different waters. <xref ref-type="fig" rid="f12">
<bold>Figure&#xa0;12</bold>
</xref> shows that the POC concentrations in the mineral and mixed water remained relatively stable over the 10-year period. However, the POC concentration in organic water decreased from 2009 to 2010, increased from 2010 to 2012, and decreased again from 2015 to 2016. POC concentrations at the sea surface may be related to the El Ni&#xf1;o phenomenon. El Ni&#xf1;o leads to an increase in the sea surface temperature in the equatorial Pacific. The stratification of the water column becomes more pronounced with the increase in sea surface temperature, inhibiting the upwelling of deep eutrophic water to the upper layers, thus affecting phytoplankton growth, which further leads to a decrease in primary productivity and a decrease in the concentration of POC in the surface layer of the ocean. Additionally, El Ni&#xf1;o can cause changes in wind patterns and ocean circulation, which may alter the distribution of nutrients in the ocean and affect phytoplankton (<xref ref-type="bibr" rid="B10">Chavez et&#xa0;al., 1999</xref>; <xref ref-type="bibr" rid="B3">Behrenfeld et&#xa0;al., 2006</xref>; <xref ref-type="bibr" rid="B12">Dore et&#xa0;al., 2009</xref>; <xref ref-type="bibr" rid="B25">Lao et&#xa0;al., 2023b</xref>). Indeed, El Ni&#xf1;o events in both 2009-2010 and 2015-2016 can partially explain the variations in POC concentrations observed in organic waters, as shown in <xref ref-type="fig" rid="f12">
<bold>Figure&#xa0;12</bold>
</xref>.</p>
<fig id="f12" position="float">
<label>Figure&#xa0;12</label>
<caption>
<p>Changes in annual mean values of mineral, mixed, and organic water sampling sites from 2007 to 2016.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-10-1295874-g012.tif"/>
</fig>
</sec>
</sec>
<sec id="s3_4">
<label>3.4</label>
<title>Limitations</title>
<p>This study compared the performances of six machine learning algorithms in estimating POC on the ocean surface. The RF algorithm improved the estimation of POC in areas with complex optical conditions near the coast. A brief discussion was also conducted on the spatiotemporal distribution of the global POC based on RF. However, this study still has some limitations that need to be addressed. These limitations are listed below:</p>
<p>1) The data collected were unevenly distributed in terms of spatial coverage. Most data points are concentrated in the Atlantic, Pacific, and Mediterranean Seas. There is a lack of sufficient measured data in the Indian Ocean and the Arctic Ocean, as well as in some eutrophic regions, such as the Red Sea, Arabian Sea, and Persian Gulf. This can affect the accuracy of the machine-learning model and result in an underestimation of POC concentrations in areas with complex optical conditions near the coast. In the future, more POC data should be collected on a global scale, and the accuracy of the data should be controlled to improve the model&#x2019;s accuracy.</p>
<p>2) This study only produced annual POC products from 2007 to 2016. However, the POC exhibited strong seasonal variability. Therefore, conducting monthly POC estimation in the future would be beneficial, allowing for a more accurate investigation of the spatiotemporal characteristics of global POC.</p>
</sec>
</sec>
<sec id="s4" sec-type="conclusions">
<label>4</label>
<title>Conclusions</title>
<p>This article is based on a large amount of open-source data and has created a large <italic>in-situ</italic> POC dataset distributed in various oceans around the world. By using geodetector, twenty factors closely related to oceanic POC concentration were screened. The dataset was partitioned based on the POC/SPM to ensure the training, validation, and test datasets had similar data distributions. Six machine learning methods were used to construct POC estimation models, with the accuracy being evaluated. By comparing the performances of six different machine learning models and their performances in different water types, it was found that the random forest algorithm achieved the highest accuracy on the test dataset. The RMSE was measured at 0.11 log10(g/m3), the MAPE was 2.73%, the variance reached 0.09, and the bias was only 0.003. The RF estimation of POC had the highest accuracy in organic waters, and the BPNN had the highest accuracy in mineral waters. Furthermore, the RF estimation results showed better consistency with NASA standard products, thereby enhancing the accuracy of POC estimation in optically complex seas. In future research, a high-precision POC estimation model should be constructed based on a large amount of measured data in all types of waters.</p>
<p>Based on the RF model, POC products from 2007 to 2016 were generated, and the spatio-temporal distribution characteristics of global POC during this 10-year period were investigated. The results indicated that the POC concentration in high-latitude seas was higher than that in mid-latitude and low-latitude seas. This could be attributed to the strong fluid motions in high-latitude regions, such as polar eddies and boundary currents, which intensify the mixing of water masses and bring organic materials from deeper layers to the ocean surface, thereby promoting the growth of phytoplankton and increasing the concentration of surface POC. Additionally, the El Ni&#xf1;o phenomenon may be associated with interannual variations in POC, as higher sea surface temperatures and increased seawater stratification during the El Ni&#xf1;o period reduce the upwelling of nutrients from the seafloor, restricting phytoplankton growth and thus lowering the concentration of POC in the surface layer. El Ni&#xf1;o events in both 2009-2010 and 2015-2016 can partially explain the variations in POC concentrations observed in organic waters. In future studies, seasonal-scale variations in POC should be investigated, and the relevant drivers of changes in POC concentrations should be studied in greater depth.</p>
</sec>
<sec id="s5" sec-type="data-availability">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/<xref ref-type="supplementary-material" rid="SM1">
<bold>Supplementary Material</bold>
</xref>. Further inquiries can be directed to the corresponding author.</p>
</sec>
<sec id="s6" sec-type="author-contributions">
<title>Author contributions</title>
<p>HW: Conceptualization, Funding acquisition, Methodology, Project administration, Supervision, Writing &#x2013; review &amp; editing. LC: Data curation, Formal Analysis, Methodology, Resources, Software, Validation, Visualization, Writing &#x2013; original draft, Writing &#x2013; review &amp; editing. LW: Resources, Software, Validation, Visualization, Writing &#x2013; review &amp; editing. RS: Investigation, Writing &#x2013; review &amp; editing. ZZ: Data curation, Writing &#x2013; review &amp; editing.</p>
</sec>
</body>
<back>
<sec id="s7" sec-type="funding-information">
<title>Funding</title>
<p>The author(s) declare financial support was received for the research, authorship, and/or publication of this article. This research was funded by the Key Laboratory of Land Satellite Remote Sensing Application, Ministry of Natural Resources of the People&#x2019;s Republic of China, grant number G202211; the Ministry of Education Industry-University Collaborative Education Project, grant number 220504039151258; and the Fundamental Research Funds for the Central Universities, grant number 18CX02064A.</p>
</sec>
<ack>
<title>Acknowledgments</title>
<p>We are grateful to the NASA Ocean Biology Processing Group for providing MODIS products (<ext-link ext-link-type="uri" xlink:href="https://oceancolor.gsfc.nasa.gov/">https://oceancolor.gsfc.nasa.gov/</ext-link>) and <italic>in situ</italic> data from SeaBASS (<ext-link ext-link-type="uri" xlink:href="https://seabass.gsfc.nasa.gov/">https://seabass.gsfc.nasa.gov/</ext-link>). We are also grateful to the Copernicus Marine Service (<ext-link ext-link-type="uri" xlink:href="https://marine.copernicus.eu/">https://marine.copernicus.eu/</ext-link>) for providing remote sensing reanalysis data.</p>
</ack>
<sec id="s8" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s9" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s10" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fmars.2023.1295874/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fmars.2023.1295874/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="DataSheet_1.pdf" id="SM1" mimetype="application/pdf"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Arrigo</surname> <given-names>K. R.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Marine microorganisms and global nutrient cycles</article-title>. <source>Nature</source> <volume>437</volume>, <fpage>349</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nature04265</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Babin</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Morel</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Fournier-Sicre</surname> <given-names>V.</given-names>
</name>
<name>
<surname>Fell</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Stramski</surname> <given-names>D.</given-names>
</name>
</person-group> (<year>2003</year>). <article-title>Light scattering properties of marine particles in coastal and open ocean waters as related to the particle mass concentration</article-title>. <source>Limnology Oceanogr.</source> <volume>48</volume> (<issue>2</issue>), <fpage>843</fpage>&#x2013;<lpage>859</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.4319/lo.2003.48.2.0843</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Behrenfeld</surname> <given-names>M. J.</given-names>
</name>
<name>
<surname>O'Malley</surname> <given-names>R. T.</given-names>
</name>
<name>
<surname>Siegel</surname> <given-names>D. A.</given-names>
</name>
<name>
<surname>McClain</surname> <given-names>C. R.</given-names>
</name>
<name>
<surname>Sarmiento</surname> <given-names>J. L.</given-names>
</name>
<name>
<surname>Feldman</surname> <given-names>G. C.</given-names>
</name>
<etal/>
</person-group>. (<year>2006</year>). <article-title>Climate-driven trends in contemporary ocean productivity</article-title>. <source>Nature</source> <volume>444</volume> (<issue>7120</issue>), <fpage>752</fpage>&#x2013;<lpage>755</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nature05317</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bonelli</surname> <given-names>A. G.</given-names>
</name>
<name>
<surname>Loisel</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Jorge</surname> <given-names>D. S. F.</given-names>
</name>
<name>
<surname>Mangin</surname> <given-names>A.</given-names>
</name>
<name>
<surname>D'Andon</surname> <given-names>O. F.</given-names>
</name>
<name>
<surname>Vantrepotte</surname> <given-names>V.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>A new method to estimate the dissolved organic carbon concentration from remote sensing in the global open ocean</article-title>. <source>Remote Sens. Environ.</source> <volume>281</volume>, <elocation-id>113227</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.rse.2022.113227</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bopp</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Le Qu&#xe9;r&#xe9;</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Heimann</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Manning</surname> <given-names>A. C.</given-names>
</name>
<name>
<surname>Monfray</surname> <given-names>P.</given-names>
</name>
</person-group> (<year>2002</year>). <article-title>Climate-induced oceanic oxygen fluxes: Implications for the contemporary carbon budget</article-title>. <source>Global Biogeochem. Cycles.</source> <volume>16</volume> (<issue>2</issue>), <fpage>6-1</fpage>&#x2013;<lpage>6-13</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/2001GB001445</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Breiman</surname> <given-names>L.</given-names>
</name>
</person-group> (<year>2001</year>). <article-title>Random forests</article-title>. <source>Mach. Learn.</source> <volume>45</volume> (<issue>1</issue>), <fpage>5</fpage>&#x2013;<lpage>32</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1023/A:1010933404324</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Brewin</surname> <given-names>R. J. W.</given-names>
</name>
<name>
<surname>Sathyendranath</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Platt</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Bouman</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Ciavatta</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Dall'Olmo</surname> <given-names>G.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Sensing the ocean biological carbon pump from space: A review of capabilities, concepts, research gaps and future developments</article-title>. <source>Earth-Sci. Rev.</source> <volume>217</volume>, <elocation-id>103604</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.earscirev.2021.103604</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cai</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Le</surname> <given-names>C.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Satellite observation of the long-term dynamics of particulate organic carbon in the East China Sea based on a hybrid algorithm</article-title>. <source>Remote Sens.</source> <volume>14</volume> (<issue>13</issue>), <elocation-id>3220</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/rs14133220</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cao</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Ge</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Optimal discretization for geographical detectors-based risk assessment</article-title>. <source>GIScience Remote Sensing.</source> <volume>50</volume> (<issue>1</issue>), <fpage>78</fpage>&#x2013;<lpage>92</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/15481603.2013.778562</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chavez</surname> <given-names>F. P.</given-names>
</name>
<name>
<surname>Strutton</surname> <given-names>P. G.</given-names>
</name>
<name>
<surname>Friederich</surname> <given-names>G. E.</given-names>
</name>
<name>
<surname>Feely</surname> <given-names>R. A.</given-names>
</name>
<name>
<surname>Feldman</surname> <given-names>G. C.</given-names>
</name>
<name>
<surname>Foley</surname> <given-names>D. G.</given-names>
</name>
<etal/>
</person-group>. (<year>1999</year>). <article-title>Biological and chemical response of the equatorial Pacific Ocean to the 1997&#x2013;98 El Ni&#xf1;o</article-title>. <source>Science</source> <volume>286</volume> (<issue>5447</issue>), <fpage>2126</fpage>&#x2013;<lpage>2131</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1126/science.286.5447.2126</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Devi</surname> <given-names>G. K.</given-names>
</name>
<name>
<surname>Ganasri</surname> <given-names>B. P.</given-names>
</name>
<name>
<surname>Dwarakish</surname> <given-names>G. S.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Applications of remote sensing in satellite oceanography: A review</article-title>. <source>Aquat. Procedia.</source> <volume>4</volume>, <fpage>579</fpage>&#x2013;<lpage>584</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.aqpro.2015.02.075</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dore</surname> <given-names>J. E.</given-names>
</name>
<name>
<surname>Lukas</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Sadler</surname> <given-names>D. W.</given-names>
</name>
<name>
<surname>Church</surname> <given-names>M. J.</given-names>
</name>
<name>
<surname>Karl</surname> <given-names>D. M.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Physical and biogeochemical modulation of ocean acidification in the central North Pacific</article-title>. <source>Proc. Natl. Acad. Sci.</source> <volume>106</volume> (<issue>30</issue>), <fpage>12235</fpage>&#x2013;<lpage>12240</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1073/pnas.0906044106</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Doney</surname> <given-names>S. C.</given-names>
</name>
<name>
<surname>Fabry</surname> <given-names>V. J.</given-names>
</name>
<name>
<surname>Feely</surname> <given-names>R. A.</given-names>
</name>
<name>
<surname>Kleypas</surname> <given-names>J. A.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Ocean acidification: the other CO<sub>2</sub> problem</article-title>. <source>Annu. Rev. Mar. Sci.</source> <volume>1</volume> (<issue>1</issue>), <fpage>169</fpage>&#x2013;<lpage>192</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1146/annurev.marine.010908.163834</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Elhorst</surname> <given-names>J. P.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Spatial Panel Data Models</article-title>. In: <person-group person-group-type="editor">
<name>
<surname>Fischer</surname> <given-names>M.M.</given-names>
</name>
<name>
<surname>Getis</surname> <given-names>A.</given-names>
</name>
</person-group> (eds). <source>Handbook of Applied Spatial Analysis: Software Tools, Methods and Applications</source> (<publisher-loc>Berlin, Heidelberg</publisher-loc>: <publisher-name>Springer Berlin Heidelberg</publisher-name>). <fpage>377</fpage>&#x2013;<lpage>407</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/978-3-642-03647-7_19</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Freund</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Schapire</surname> <given-names>R. E.</given-names>
</name>
</person-group> (<year>1995</year>). "<article-title>A decision-theoretic generalization of on-line learning and an application to boosting</article-title>," in <source>Computational Learning Theory. EuroCOLT 1995. Lecture Notes in Computer Science</source>, eds <person-group person-group-type="editor">
<name>
<surname>Vit&#xe1;nyi</surname> <given-names>P.</given-names>
</name>
</person-group> (<publisher-loc>Berlin, Heidelberg</publisher-loc>: <publisher-name>Springer</publisher-name>) <volume>55</volume> (<issue>1</issue>), <fpage>119</fpage>&#x2013;<lpage>139</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/3-540-59119-2_166</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gardner</surname> <given-names>W. D.</given-names>
</name>
<name>
<surname>Mishonov</surname> <given-names>A. V.</given-names>
</name>
<name>
<surname>Richardson</surname> <given-names>M. J.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>Global POC concentrations from <italic>in-situ</italic> and satellite data</article-title>. <source>Deep Sea Res. Part II: Topical Stud. Oceanogr.</source> <volume>53</volume> (<issue>5</issue>), <fpage>718</fpage>&#x2013;<lpage>740</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.dsr2.2006.01.029</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Good</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Fiedler</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Mao</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Martin</surname> <given-names>M. J.</given-names>
</name>
<name>
<surname>Worsfold</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>The current configuration of the OSTIA system for operational production of foundation sea surface temperature and ice concentration analyses</article-title>. <source>Remote Sens.</source> <volume>12</volume> (<issue>4</issue>), <fpage>720</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/rs12040720</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hayley</surname> <given-names>E. K.</given-names>
</name>
<name>
<surname>Victor</surname> <given-names>M. V.</given-names>
</name>
<name>
<surname>Brewin</surname> <given-names>R. J. W.</given-names>
</name>
<name>
<surname>Giorgio</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Hickman</surname> <given-names>A. E.</given-names>
</name>
<name>
<surname>Thomas</surname> <given-names>J.</given-names>
</name>
<etal/>
</person-group>. (<year>2017</year>). <article-title>Validation and intercomparison of ocean color algorithms for estimating particulate organic carbon in the oceans</article-title>. <source>Front. Mar. Sci.</source> <volume>4</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fmars.2017.00251</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jahnke</surname> <given-names>R. A.</given-names>
</name>
</person-group> (<year>1996</year>). <article-title>The global ocean flux of particulate organic carbon: Areal distribution and magnitude</article-title>. <source>Global Biogeochem. Cycles.</source> <volume>10</volume> (<issue>1</issue>), <fpage>71</fpage>&#x2013;<lpage>88</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/95GB03525</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jiang</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Loiselle</surname> <given-names>S. A.</given-names>
</name>
<name>
<surname>Cai</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Duan</surname> <given-names>H.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Remote sensing of particulate organic carbon dynamics in a eutrophic lake (Taihu Lake, China)</article-title>. <source>Sci. Total Environ.</source> <volume>532</volume>, <fpage>245</fpage>&#x2013;<lpage>254</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.scitotenv.2015.05.120</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Hwang</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Na</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Hyun</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Carbon cycling in the East Sea (Japan Sea): A review</article-title>. <source>Front. Mar. Sci.</source> <volume>9</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fmars.2022.938935</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Krishnapuram</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Shah</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Smola</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Aggarwal</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Shen</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Rastogi</surname> <given-names>R.</given-names>
</name>
</person-group> (<year>2016</year>). <source>KDD '16: The 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</source> (<publisher-loc>San Francisco, California, USA</publisher-loc>: <publisher-name>Association for Computing Machinery</publisher-name>). doi:&#xa0;<pub-id pub-id-type="doi">10.1145/2939672</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kumar</surname> <given-names>S. P.</given-names>
</name>
<name>
<surname>Madhupratap</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Kumar</surname> <given-names>M. D.</given-names>
</name>
<name>
<surname>Gauns</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Muraleedharan</surname> <given-names>P. M.</given-names>
</name>
<name>
<surname>Sarma</surname> <given-names>V. V. S. S.</given-names>
</name>
<etal/>
</person-group>. (<year>2000</year>). <article-title>Physical control of primary productivity on a seasonal scale in central and eastern Arabian Sea</article-title>. <source>J. Earth Syst. Sci.</source> <volume>109</volume>, <fpage>433</fpage>&#x2013;<lpage>441</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/BF02708331</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lao</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Jin</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Lu</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>X.</given-names>
</name>
<etal/>
</person-group>. (<year>2023</year>a). <article-title>Characteristics and mechanisms of typhoon-induced decomposition of organic matter and its implication for climate change</article-title>. <source>J. Geophysical Research: Biogeosciences</source> <volume>128</volume> (<issue>6</issue>), <elocation-id>e2023JG007518</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/2023JG007518</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lao</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Ling</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Jin</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>C.</given-names>
</name>
<etal/>
</person-group>. (<year>2023</year>b). <article-title>External dynamic mechanisms controlling the periodic offshore blooms in Beibu Gulf</article-title>. <source>J. Geophysical Research: Oceans</source> <volume>128</volume> (<issue>6</issue>), <elocation-id>e2023JC019689</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/2023JC019689</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lao</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Lu</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Jin</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>X.</given-names>
</name>
<etal/>
</person-group>. (<year>2023</year>c). <article-title>Effects of upwelling and runoff on water mass mixing and nutrient supply induced by typhoons: Insight from dual water isotopes tracing</article-title>. <source>Limnol. Oceanogr.</source> <volume>68</volume> (<issue>1</issue>), <fpage>284</fpage>&#x2013;<lpage>295</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/lno.12266</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lavergne</surname> <given-names>T.</given-names>
</name>
<name>
<surname>S&#xf8;rensen</surname> <given-names>A. M.</given-names>
</name>
<name>
<surname>Kern</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Tonboe</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Pedersen</surname> <given-names>L. T.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Version 2 of the EUMETSAT OSI SAF and ESA CCI sea-ice concentration climate data records</article-title>. <source>Cryosphere.</source> <volume>13</volume> (<issue>1</issue>), <fpage>49</fpage>&#x2013;<lpage>78</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.5194/tc-13-49-2019</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Le</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Lehrter</surname> <given-names>J. C.</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Macintyre</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Beck</surname> <given-names>M. W.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Satellite observation of particulate organic carbon dynamics on the Louisiana continental shelf</article-title>. <source>J. Geophysical Research: Oceans.</source> <volume>122</volume> (<issue>1</issue>), <fpage>555</fpage>&#x2013;<lpage>569</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/2016JC012275</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lecun</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Bengio</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Hinton</surname> <given-names>G.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Deep learning</article-title>. <source>Nature</source> <volume>521</volume> (<issue>7553</issue>), <fpage>436</fpage>&#x2013;<lpage>444</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/nature14539</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lecun</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Bottou</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Bengio</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Haffner</surname> <given-names>P.</given-names>
</name>
</person-group> (<year>1998</year>). <article-title>Gradient-based learning applied to document recognition</article-title>. <source>Proc. IEEE.</source> <volume>86</volume> (<issue>11</issue>), <fpage>2278</fpage>&#x2013;<lpage>2324</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/5.726791</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Bai</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>Q.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Improving satellite retrieval of oceanic particulate organic carbon concentrations using machine learning methods</article-title>. <source>Remote Sens. Environ.</source> <volume>256</volume>, <elocation-id>112316</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.rse.2021.112316</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Loisel</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Bosc</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Stramski</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Oubelkheir</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Deschamps</surname> <given-names>P. Y.</given-names>
</name>
</person-group> (<year>2001</year>). <article-title>Seasonal variability of the backscattering coefficient in the Mediterranean Sea based on satellite SeaWiFS imagery</article-title>. <source>Geophys. Res. Lett.</source> <volume>28</volume> (<issue>22</issue>), <fpage>4203</fpage>&#x2013;<lpage>4206</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/2001GL013863</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Loisel</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Nicolas</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Deschamps</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Frouin</surname> <given-names>R.</given-names>
</name>
</person-group> (<year>2002</year>). <article-title>Seasonal and inter-annual variability of particulate organic matter in the global ocean</article-title>. <source>Geophys. Res. Lett.</source> <volume>29</volume> (<issue>24</issue>), <fpage>49</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/2002GL015948</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Maritorena</surname> <given-names>S.</given-names>
</name>
<name>
<surname>D'Andon</surname> <given-names>O. H. F.</given-names>
</name>
<name>
<surname>Mangin</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Siegel</surname> <given-names>D. A.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Merged satellite ocean color data products using a bio-optical model: Characteristics, benefits and issues</article-title>. <source>Remote Sens. Environ.</source> <volume>114</volume> (<issue>8</issue>), <fpage>1791</fpage>&#x2013;<lpage>1804</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.rse.2010.04.002</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Martiny</surname> <given-names>A. C.</given-names>
</name>
<name>
<surname>Vrugt</surname> <given-names>J. A.</given-names>
</name>
<name>
<surname>Lomas</surname> <given-names>M. W.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Concentrations and ratios of particulate organic carbon, nitrogen, and phosphorus in the global ocean</article-title>. <source>Sci. Data.</source> <volume>1</volume> (<issue>1</issue>), <fpage>140048</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/sdata.2014.48</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Massari</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Camici</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Ciabatta</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Brocca</surname> <given-names>L.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Exploiting satellite-based surface soil moisture for flood forecasting in the Mediterranean area: state update versus rainfall correction</article-title>. <source>Remote Sens.</source> <volume>10</volume> (<issue>2</issue>), <elocation-id>292</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/rs10020292</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mcculloch</surname> <given-names>W. S.</given-names>
</name>
<name>
<surname>Pitts</surname> <given-names>W.</given-names>
</name>
</person-group> (<year>1990</year>). <article-title>A logical calculus of the ideas immanent in nervous activity</article-title>. <source>Bull. Math. Biol.</source> <volume>52</volume> (<issue>1</issue>), <fpage>99</fpage>&#x2013;<lpage>115</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/BF02459570</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Merchant</surname> <given-names>C. J.</given-names>
</name>
<name>
<surname>Embury</surname> <given-names>O.</given-names>
</name>
<name>
<surname>Bulgin</surname> <given-names>C. E.</given-names>
</name>
<name>
<surname>Block</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Donlon</surname> <given-names>C.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Satellite-based time-series of sea-surface temperature since 1981 for climate applications</article-title>. <source>Sci. Data.</source> <volume>6</volume> (<issue>1</issue>), <fpage>223</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1038/s41597-019-0236-x</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Morel</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Prieur</surname> <given-names>L.</given-names>
</name>
</person-group> (<year>1977</year>). <article-title>Analysis of variations in ocean color</article-title>. <source>Limnol. Oceanogr.</source> <volume>22</volume> (<issue>4</issue>), <fpage>709</fpage>&#x2013;<lpage>722</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.4319/lo.1977.22.4.0709</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>O'Reilly</surname> <given-names>J. E.</given-names>
</name>
</person-group> (<year>2000</year>). <article-title>Ocean color chlorophyll algorithms for SeaWiFS, OC2, and OC4: Version 4</article-title>. <source>SeaWiFS Postlaunch Calibration and Validation Analyses, Part 3. NASA Tech. Memo.</source> <volume>11</volume>, <fpage>9</fpage>&#x2013;<lpage>27</lpage>. Available at: <uri xlink:href="https://cir.nii.ac.jp/crid/1570572701233940096">https://cir.nii.ac.jp/crid/1570572701233940096</uri>.</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>O'Reilly</surname> <given-names>J. E.</given-names>
</name>
<name>
<surname>Werdell</surname> <given-names>P. J.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Chlorophyll algorithms for ocean color sensors - OC4, OC5 &amp; OC6</article-title>. <source>Remote Sens. Environ.</source> <volume>229</volume>, <fpage>32</fpage>&#x2013;<lpage>47</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.rse.2019.04.021</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sardessai</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Shetye</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Maya</surname> <given-names>M. V.</given-names>
</name>
<name>
<surname>Mangala</surname> <given-names>K. R.</given-names>
</name>
<name>
<surname>Prasanna Kumar</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Nutrient characteristics of the water masses and their seasonal variability in the eastern equatorial Indian Ocean</article-title>. <source>Mar. Environ. Res.</source> <volume>70</volume> (<issue>3</issue>), <fpage>272</fpage>&#x2013;<lpage>282</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.marenvres.2010.05.009</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Sarmiento</surname> <given-names>J. L.</given-names>
</name>
</person-group> (<year>2006</year>). <source>Ocean Biogeochemical Dynamics</source>. <publisher-name>Princeton University Press</publisher-name>. doi:&#xa0;<pub-id pub-id-type="doi">10.1515/9781400849079</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sauz&#xe8;de</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Claustre</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Uitz</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Jamet</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Dall'Olmo</surname> <given-names>G.</given-names>
</name>
<name>
<surname>D'Ortenzio</surname> <given-names>F.</given-names>
</name>
<etal/>
</person-group>. (<year>2016</year>). <article-title>A neural network-based method for merging ocean color and Argo data to extend surface bio-optical properties to depth: Retrieval of the particulate backscattering coefficient</article-title>. <source>J. Geophysical Research: Oceans.</source> <volume>121</volume> (<issue>4</issue>), <fpage>2552</fpage>&#x2013;<lpage>2571</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1002/2015JC011408</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sauz&#xe8;de</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Johnson</surname> <given-names>J. E.</given-names>
</name>
<name>
<surname>Claustre</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Camps-Valls</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Ruescas</surname> <given-names>A. B.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Estimation of oceanic particulate organic carbon with machine learning</article-title>. <source>ISPRS Ann. Photogramm. Remote Sens. Spatial Inf. Sci.</source> <volume>2</volume>, <fpage>949</fpage>&#x2013;<lpage>956</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.5194/isprs-annals-V-2-2020-949-2020</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sauz&#xe8;de</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Claustre</surname> <given-names>H.</given-names>
</name>
<name>
<surname>R.</surname>
</name>
<name>
<surname>Remanan</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Uitz</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Guinehut</surname> <given-names>S.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>New global vertical distribution of gridded particulate organic carbon and chlorophyll-a concentration using machine learning for CMEMS. 9th EuroGOOS International conference</article-title>. <source>Shom and Ifremer and EuroGOOS AISBL</source>. (<publisher-loc>Brest, France</publisher-loc>), <fpage>313</fpage>&#x2013;<lpage>320</lpage>. Available at: <uri xlink:href="https://hal.science/hal-03335370v2">https://hal.science/hal-03335370v2</uri>.</citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sawaya</surname> <given-names>K. E.</given-names>
</name>
<name>
<surname>Olmanson</surname> <given-names>L. G.</given-names>
</name>
<name>
<surname>Heinert</surname> <given-names>N. J.</given-names>
</name>
<name>
<surname>Brezonik</surname> <given-names>P. L.</given-names>
</name>
<name>
<surname>Bauer</surname> <given-names>M. E.</given-names>
</name>
</person-group> (<year>2003</year>). <article-title>Extending satellite remote sensing to local scales: land and water resource monitoring using high-resolution imagery</article-title>. <source>Remote Sens. Environ.</source> <volume>88</volume> (<issue>1</issue>), <fpage>144</fpage>&#x2013;<lpage>156</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.rse.2003.04.006</pub-id>
</citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shahriari</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Swersky</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Adams</surname> <given-names>R. P.</given-names>
</name>
<name>
<surname>De Freitas</surname> <given-names>N.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Taking the human out of the loop: A review of Bayesian optimization</article-title>. <source>Proc. IEEE.</source> <volume>104</volume> (<issue>1</issue>), <fpage>148</fpage>&#x2013;<lpage>175</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1109/JPROC.2015.2494218</pub-id>
</citation>
</ref>
<ref id="B49">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Shi</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Ji</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Dai</surname> <given-names>R.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Application of synchrosqueezed wavelet transform in microseismic monitoring of mines</article-title>. <conf-name>IOP Conference Series: Earth and Environmental Science</conf-name> <volume>384</volume> (<issue>01</issue>), <fpage>012075</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1088/1755-1315/384/1/012075</pub-id>
</citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Son</surname> <given-names>Y. B.</given-names>
</name>
<name>
<surname>Gardner</surname> <given-names>W. D.</given-names>
</name>
<name>
<surname>Mishonov</surname> <given-names>A. V.</given-names>
</name>
<name>
<surname>Richardson</surname> <given-names>M. J.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Multispectral remote-sensing algorithms for particulate organic carbon (POC): The Gulf of Mexico</article-title>. <source>Remote Sens. Environ.</source> <volume>113</volume> (<issue>1</issue>), <fpage>50</fpage>&#x2013;<lpage>61</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.rse.2008.08.011</pub-id>
</citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Song</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Ge</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>C.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>An optimal parameters-based geographical detector model enhances geographic characteristics of explanatory variables for spatial heterogeneity analysis: cases with different types of spatial data</article-title>. <source>GISci. Remote Sens.</source> <volume>57</volume> (<issue>5</issue>), <fpage>593</fpage>&#x2013;<lpage>610</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1080/15481603.2020.1760434</pub-id>
</citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Steinacher</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Joos</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Fr&#xf6;licher</surname> <given-names>T. L.</given-names>
</name>
<name>
<surname>Plattner</surname> <given-names>G.-K.</given-names>
</name>
<name>
<surname>Doney</surname> <given-names>S. C.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Imminent ocean acidification projected with the NCAR global coupled carbon cycle-climate model</article-title>. <source>Biogeosciences Discussions</source> <volume>5</volume> (<issue>4</issue>), <fpage>4353</fpage>&#x2013;<lpage>4393</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.5194/bgd-5-4353-2008</pub-id>
</citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Stramski</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Joshi</surname> <given-names>I.</given-names>
</name>
<name>
<surname>Reynolds</surname> <given-names>R. A.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Ocean color algorithms to estimate the concentration of particulate organic carbon in surface waters of the global ocean in support of a long-term data record from multiple satellite missions</article-title>. <source>Remote Sens. Environ.</source> <volume>269</volume>, <elocation-id>112776</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.rse.2021.112776</pub-id>
</citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Stramski</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Reynolds</surname> <given-names>R. A.</given-names>
</name>
<name>
<surname>Babin</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Kaczmarek</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Lewis</surname> <given-names>M. R.</given-names>
</name>
<name>
<surname>R&#xf6;ttgers</surname> <given-names>R.</given-names>
</name>
<etal/>
</person-group>. (<year>2008</year>). <article-title>Relationships between the surface concentration of particulate organic carbon and optical properties in the eastern South Pacific and eastern Atlantic Oceans</article-title>. <source>Biogeosciences</source> <volume>5</volume> (<issue>1</issue>), <fpage>171</fpage>&#x2013;<lpage>201</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.5194/bg-5-171-2008</pub-id>
</citation>
</ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Stramski</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Reynolds</surname> <given-names>R. A.</given-names>
</name>
<name>
<surname>Kahru</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>1999</year>). <article-title>Estimation of particulate organic carbon in the ocean from satellite remote sensing</article-title>. <source>Science</source> <volume>285</volume> (<issue>5425</issue>), <fpage>239</fpage>&#x2013;<lpage>242</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1126/science.285.5425.239</pub-id>
</citation>
</ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tran</surname> <given-names>T. K.</given-names>
</name>
<name>
<surname>Dufor&#xea;t-Gaurier</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Vantrepotte</surname> <given-names>V.</given-names>
</name>
<name>
<surname>Jorge</surname> <given-names>D. S. F.</given-names>
</name>
<name>
<surname>M&#xe9;riaux</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Cauvin</surname> <given-names>A.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>Deriving particulate organic carbon in coastal waters from remote sensing: inter-comparison exercise and development of a maximum band-ratio approach</article-title>. <source>Remote Sens.</source> <volume>11</volume> (<issue>23</issue>), <elocation-id>2849</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/rs11232849</pub-id>
</citation>
</ref>
<ref id="B57">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Verde</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Mallinis</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Tsakiri-Strati</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Georgiadis</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Patias</surname> <given-names>P.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Assessment of radiometric resolution impact on remote sensing data classification accuracy</article-title>. <source>Remote Sens.</source> <volume>10</volume> (<issue>8</issue>), <elocation-id>1267</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/rs10081267</pub-id>
</citation>
</ref>
<ref id="B58">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Hu</surname> <given-names>Y.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Environmental health risk detection with GeogDetector</article-title>. <source>Environ. Modell. Software</source> <volume>33</volume>, <fpage>114</fpage>&#x2013;<lpage>115</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.envsoft.2012.01.015</pub-id>
</citation>
</ref>
<ref id="B59">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Stubbins</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Dahlgren</surname> <given-names>R. A.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Dissolved organic matter dynamics in the epipelagic northwest pacific low-latitude western boundary current system: insights from optical analyses</article-title>. <source>J. Geophys. Res.: Oceans</source> <volume>126</volume> (<issue>9</issue>), <elocation-id>e2021JC017458</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/2021JC017458</pub-id>
</citation>
</ref>
<ref id="B60">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>F.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>Y.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Research progress on remote sensing inversion of ocean particulate organic carbon</article-title>. <source>J. Hangzhou Normal Univ. (Natural Sci. Edition).</source> <volume>16</volume> (<issue>2</issue>), <fpage>205</fpage>&#x2013;<lpage>212</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3969/j.issn.1674-232X.2017.02.015</pub-id>
</citation>
</ref>
<ref id="B61">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>C.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Geodetector: principle and prospective</article-title>. <source>Acta Geographica Sinica.</source> <volume>72</volume> (<issue>01</issue>), <fpage>116</fpage>&#x2013;<lpage>134</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.11821/dlxb201701010</pub-id>
</citation>
</ref>
<ref id="B62">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Werdell</surname> <given-names>P. J.</given-names>
</name>
<name>
<surname>Bailey</surname> <given-names>S. W.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>An improved in-situ bio-optical data set for ocean color algorithm development and satellite data product validation</article-title>. <source>Remote Sens. Environ.</source> <volume>98</volume> (<issue>1</issue>), <fpage>122</fpage>&#x2013;<lpage>140</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.rse.2005.07.001</pub-id>
</citation>
</ref>
<ref id="B63">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wo&#x17a;niak</surname> <given-names>S. B.</given-names>
</name>
<name>
<surname>Stramski</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Stramska</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Reynolds</surname> <given-names>R. A.</given-names>
</name>
<name>
<surname>Wright</surname> <given-names>V. M.</given-names>
</name>
<name>
<surname>Miksic</surname> <given-names>E. Y.</given-names>
</name>
<etal/>
</person-group>. (<year>2010</year>). <article-title>Optical variability of seawater in relation to particle concentration, composition, and size distribution in the nearshore marine environment at Imperial Beach, California</article-title>. <source>J. Geophys. Res.</source> <volume>115</volume>, <fpage>C08027</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/2009JC005554</pub-id>
</citation>
</ref>
<ref id="B64">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Sukigara</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Goes</surname> <given-names>J. I.</given-names>
</name>
<name>
<surname>Do Rosario Gomes</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Zhu</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>S.</given-names>
</name>
<etal/>
</person-group>. (<year>2019</year>). <article-title>Interannual changes in summer phytoplankton community composition in relation to water mass variability in the East China Sea</article-title>. <source>J. Oceanogr.</source> <volume>75</volume> (<issue>1</issue>), <fpage>61</fpage>&#x2013;<lpage>79</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s10872-018-0484-y</pub-id>
</citation>
</ref>
<ref id="B65">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yamashita</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Yagi</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Ueno</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Ooki</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Hirawake</surname> <given-names>T.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Characterization of the water masses in the shelf region of the Bering and Chukchi seas with fluorescent organic matter</article-title>. <source>J. Geophys. Res.: Oceans</source> <volume>124</volume> (<issue>11</issue>), <fpage>7545</fpage>&#x2013;<lpage>7556</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1029/2019JC015476</pub-id>
</citation>
</ref>
<ref id="B66">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Peng</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Kuo</surname> <given-names>C. C. J.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Show, attend, and translate: unsupervised image translation with self-regularization and attention</article-title>. <source>IEEE Trans. Image Process.</source> <volume>28</volume> (<issue>10</issue>), <fpage>4845</fpage>&#x2013;<lpage>4856</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.48550/arXiv.1806.06195</pub-id>
</citation>
</ref>
<ref id="B67">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Fu</surname> <given-names>G.</given-names>
</name>
<name>
<surname>He</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Luo</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Zheng</surname> <given-names>Z.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Spatiotemporal patterns and source attribution of nitrogen load in a river basin with complex pollution sources</article-title>. <source>Water Res.</source> <volume>94</volume>, <fpage>187</fpage>&#x2013;<lpage>199</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1016/j.watres.2016.02.040</pub-id>
</citation>
</ref>
<ref id="B68">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zaneveld</surname> <given-names>J. R. V.</given-names>
</name>
<name>
<surname>Mobley</surname> <given-names>C. D.</given-names>
</name>
</person-group> (<year>1995</year>). <article-title>Review of light and water: radiative transfer in natural waters, by C. D. Mobley</article-title>. <source>Bull. Amer. Meteorol. Soc.</source> <volume>76</volume> (<issue>1</issue>), <fpage>60</fpage>&#x2013;<lpage>63</lpage>. Available at: <uri xlink:href="https://www.jstor.org/stable/2623161">https://www.jstor.org/stable/2623161</uri>.</citation>
</ref>
<ref id="B69">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zou</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Tang</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Deng</surname> <given-names>C.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>A novel method to mitigate the multipath error for BDS-2 dam deformation monitoring</article-title>. <source>Remote Sens.</source> <volume>13</volume> (<issue>9</issue>), <elocation-id>1787</elocation-id>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/rs13091787</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>