<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" article-type="research-article" dtd-version="2.3" xml:lang="EN">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Mar. Sci.</journal-id>
<journal-title>Frontiers in Marine Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Mar. Sci.</abbrev-journal-title>
<issn pub-type="epub">2296-7745</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fmars.2023.1296274</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Marine Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Predicting rapid intensification of tropical cyclones in the western North Pacific: a machine learning and net energy gain rate approach</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Kim</surname>
<given-names>Sung-Hun</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1918500"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Lee</surname>
<given-names>Woojeong</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="author-notes" rid="fn001">
<sup>*</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1973344"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Kang</surname>
<given-names>Hyoun-Woo</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1518681"/>
<role content-type="https://credit.niso.org/contributor-roles/formal-analysis/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Kang</surname>
<given-names>Sok Kuh</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1984790"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-review-editing/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Korea Institute of Ocean Science and Technology</institution>, <addr-line>Busan</addr-line>, <country>Republic of Korea</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Forecast Research Department, National Institute of Meteorological Sciences</institution>, <addr-line>Seogwipo, Jeju</addr-line>, <country>Republic of Korea</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>Edited by: Scott Glenn, Rutgers, The State University of New Jersey, United States</p>
</fn>
<fn fn-type="edited-by">
<p>Reviewed by: Ahmed Aziz, Rutgers, The State University of New Jersey, United States</p>
<p>Dasol Kim, University of Florida, United States</p>
</fn>
<fn fn-type="corresp" id="fn001">
<p>*Correspondence: Woojeong Lee, <email xlink:href="mailto:lwj@korea.kr">lwj@korea.kr</email>
</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>19</day>
<month>01</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2023</year>
</pub-date>
<volume>10</volume>
<elocation-id>1296274</elocation-id>
<history>
<date date-type="received">
<day>18</day>
<month>09</month>
<year>2023</year>
</date>
<date date-type="accepted">
<day>29</day>
<month>12</month>
<year>2023</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2024 Kim, Lee, Kang and Kang</copyright-statement>
<copyright-year>2024</copyright-year>
<copyright-holder>Kim, Lee, Kang and Kang</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>In this study, a machine learning (ML)-based Tropical Cyclones (TCs) Rapid Intensification (RI) prediction model has been developed by using the Net Energy Gain Rate Index (<italic>NGR</italic>). This index realistically captures the energy exchanges between the ocean and the atmosphere during the intensification of TCs. It does so by incorporating the thermal conditions of the upper ocean and using an accurate parameterization for sea surface roughness. To evaluate the effectiveness of <italic>NGR</italic> in enhancing prediction accuracy, five distinct ML algorithms were utilized: Decision Tree, Logistic Regression, Support Vector Machine, K-Nearest Neighbors, and Feed-forward Neural Network. Two sets of experiments were performed for each algorithm. The first set used only traditional predictors, while the second set incorporated <italic>NGR</italic>. The outcomes revealed that models trained with the inclusion of <italic>NGR</italic> exhibited superior performance compared to those that only used traditional predictors. Additionally, an ensemble model was developed by utilizing a hard-voting method, combining the predictions of all five individual algorithms. This ensemble approach showed a noteworthy improvement of approximately 10% in the skill score of RI prediction when <italic>NGR</italic> was included. The findings of this study emphasize the potential of <italic>NGR</italic> in refining TC intensity prediction and underline the effectiveness of ensemble ML models in RI event detection.</p>
</abstract>
<kwd-group>
<kwd>rapid intensification of the tropical cyclone</kwd>
<kwd>drag coefficient</kwd>
<kwd>tropical cyclone-ocean interaction</kwd>
<kwd>tropical cyclone-induced vertical ocean mixing</kwd>
<kwd>machine learning</kwd>
</kwd-group>
<counts>
<fig-count count="6"/>
<table-count count="7"/>
<equation-count count="10"/>
<ref-count count="63"/>
<page-count count="14"/>
<word-count count="7445"/>
</counts>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-in-acceptance</meta-name>
<meta-value>Ocean Observation</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1" sec-type="intro">
<label>1</label>
<title>Introduction</title>
<p>Tropical cyclones (TCs), as one of the most devastating natural hazards in the world, have caused huge social and economic damage and loss of life. The recent global TC&#xa0;activity showed a significant increasing trend in major TCs, rapid intensification (RI)&#xa0;events, and TC-induced damage (<xref ref-type="bibr" rid="B1">Balaguru et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B31">Kossin et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B27">Klotzbach&#xa0;et&#xa0;al., 2022</xref>). Many studies have warned of possible serious disasters due to the increase in the frequency of very intense TCs above category 4 and in lifetime maximum intensity under human-induced climate change (<xref ref-type="bibr" rid="B43">Murakami et&#xa0;al., 2013</xref>; <xref ref-type="bibr" rid="B29">Knutson et&#xa0;al., 2020</xref>). To reduce the damage from future TCs, which are anticipated to become much stronger, the demand for more accurate forecasts of TC intensity is greater than ever. While there has been some recent progress in intensity prediction due to the emergence of several skillful guidance products, the prediction of RI, defined as a change in maximum sustained wind of 30 kt per 24 h (<xref ref-type="bibr" rid="B20">Kaplan and DeMaria, 2003</xref>), remains a challenging area for several operational TC centers (<xref ref-type="bibr" rid="B9">DeMaria et&#xa0;al., 2021</xref>).</p>
<p>There have been many attempts and efforts to improve the prediction skill for intensity change, including RI, based on statistical (<xref ref-type="bibr" rid="B10">DeMaria and Kaplan, 1994</xref>; <xref ref-type="bibr" rid="B11">DeMaria and Kaplan, 1999</xref>; <xref ref-type="bibr" rid="B36">Li et&#xa0;al., 2018</xref>) or dynamical approaches (<xref ref-type="bibr" rid="B2">Bender et&#xa0;al., 2007</xref>; <xref ref-type="bibr" rid="B3">Biswas et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B38">Liu et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B62">Zhang et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B63">Zhang et&#xa0;al., 2023</xref>), or their combination (<xref ref-type="bibr" rid="B28">Knaff et&#xa0;al., 2005</xref>; <xref ref-type="bibr" rid="B26">Kim et&#xa0;al., 2018</xref>), over the past few decades. Statistical TC intensity prediction models have been developed utilizing diverse statistical methods such as multiple linear or logistic regression (<xref ref-type="bibr" rid="B10">DeMaria and Kaplan, 1994</xref>; <xref ref-type="bibr" rid="B48">Rozoff and Kossin, 2011</xref>; <xref ref-type="bibr" rid="B36">Li et&#xa0;al., 2018</xref>). The dynamical approaches have largely focused on improving model physics (<xref ref-type="bibr" rid="B6">Chen et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B33">Lee et&#xa0;al., 2022</xref>; <xref ref-type="bibr" rid="B56">Wang et&#xa0;al., 2022</xref>), increasing model horizontal and vertical resolutions (<xref ref-type="bibr" rid="B16">Feng and Wang, 2021</xref>; <xref ref-type="bibr" rid="B41">Magnusson et&#xa0;al., 2021</xref>), improving TC vortex initialization (<xref ref-type="bibr" rid="B38">Liu et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B35">Li et&#xa0;al., 2021</xref>) and data assimilation (<xref ref-type="bibr" rid="B62">Zhang et&#xa0;al., 2020</xref>; <xref ref-type="bibr" rid="B40">Lu et&#xa0;al., 2022</xref>).</p>
<p>The statistical-dynamical models have been primarily developed over the decades in two respects: (1) by applying new statistical approaches and (2) by finding atmospheric and oceanic predictors highly related to TC intensity change. With the development of new learning algorithms and computer technology, more complicated machine learning (ML) techniques have been applied to predict TC intensity change, besides conventional statistical regression approaches such as multi-linear (<xref ref-type="bibr" rid="B26">Kim et&#xa0;al., 2018</xref>), Bayesian (<xref ref-type="bibr" rid="B51">Song et&#xa0;al., 2018</xref>), logistic (<xref ref-type="bibr" rid="B48">Rozoff and Kossin, 2011</xref>; <xref ref-type="bibr" rid="B22">Kaplan et&#xa0;al., 2015</xref>) and regression trees (<xref ref-type="bibr" rid="B17">Gao et&#xa0;al., 2016</xref>). <xref ref-type="bibr" rid="B7">Cloud et&#xa0;al. (2019)</xref> and <xref ref-type="bibr" rid="B52">Su et&#xa0;al. (2020)</xref> showed that neural network methods can provide more accurate predictions of TC intensity change, including RI. <xref ref-type="bibr" rid="B49">Shaiba and Hahsler (2016)</xref> predicted RI events with popular ML-based models, support vector machines (SVM), logistic regression, Na&#xef;ve-Bayes classifier, and classification and regression trees classifier. <xref ref-type="bibr" rid="B42">Mercer and Grimes (2017)</xref> performed an ensemble of the three ML methods, SVM, artificial neural networks, and random forests to generate probabilistic RI forecasts for Atlantic TCs. <xref ref-type="bibr" rid="B19">Griffin et&#xa0;al. (2022)</xref> developed a probabilistic model for predicting RI in Atlantic and eastern North Pacific TCs based on a convolutional neural network (CNN). <xref ref-type="bibr" rid="B58">Xu et&#xa0;al. (2021)</xref> developed a TC intensity prediction model based on multilayer perceptron (MLP) for the Atlantic basin. <xref ref-type="bibr" rid="B57">Wei et&#xa0;al. 
(2023)</xref> used the CNN to predict the occurrence of RI and non-RI. These advanced ML-based predictions have been shown to outperform several existing operational TC intensity guidance products.</p>
<p>Before the application of ML methods to TC intensity forecasting, it was known that the statistical-dynamical-based forecast models using climatological, persistence, and numerical model predictors provided the highest skill in intensity prediction (<xref ref-type="bibr" rid="B18">Goldenberg et&#xa0;al., 2015</xref>; <xref ref-type="bibr" rid="B26">Kim et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B59">Yamaguchi et&#xa0;al., 2018</xref>; <xref ref-type="bibr" rid="B58">Xu et&#xa0;al., 2021</xref>; <xref ref-type="bibr" rid="B30">Ko et&#xa0;al., 2023</xref>). The statistical-dynamical model developed by <xref ref-type="bibr" rid="B26">Kim et&#xa0;al. (2018)</xref> showed the smallest mean absolute errors at short lead times (up to 24&#xa0;h) for TC intensity prediction compared to operational dynamical forecast models (<xref ref-type="bibr" rid="B26">Kim et&#xa0;al., 2018</xref>). After a 24-h lead time, their model still showed skill comparable to the best operational dynamical models such as the Global Forecast System (GFS) and the Hurricane Weather Research and Forecasting model (HWRF). The Typhoon Intensity Forecast Scheme (TIFS) for the western North Pacific (WNP), which uses SHIPS and the Global Spectral Model (GSM) of the Japan Meteorological Agency (JMA), showed considerable forecast skill relative to the GSM and has reportedly helped improve the accuracy of JMA intensity forecasts (<xref ref-type="bibr" rid="B59">Yamaguchi et&#xa0;al., 2018</xref>). With the advent of ML in recent years, ML-based TC intensity prediction studies have demonstrated results that outperform the statistical-dynamical models. The MLP model correctly predicted more RI events than other operational TC intensity models and outperformed the statistical-dynamical models such as SHIPS, DSHIPS and LGEM by 5-22% in simulating real-time operational forecasts (<xref ref-type="bibr" rid="B58">Xu et&#xa0;al., 2021</xref>). 
A Consensus Machine Learning (CML) model with input data extracted from HWRF for TC intensity change, especially for RI, reached a probability of detection (POD) of 56% and a false alarm ratio (FAR) of 46%, while the operational models (GFS, HWRF, SHIPS) had only 10-30% POD but 50-60% FAR (<xref ref-type="bibr" rid="B30">Ko et&#xa0;al., 2023</xref>).</p>
<p>The vertical wind shear is the most important atmospheric predictor of TC intensity change, with large wind shear generally being unfavorable for intensification (<xref ref-type="bibr" rid="B10">DeMaria and Kaplan, 1994</xref>). In the oceanic predictors, the intensification potential (POT) defined as the difference between maximum potential intensity (MPI) and maximum wind at the initial time has been considered the most important predictor (<xref ref-type="bibr" rid="B21">Kaplan et&#xa0;al., 2010</xref>). These predictors have been essentially included in the predictor pools in the representative operational TC intensity prediction models, Statistical Hurricane Intensity Prediction Scheme (<xref ref-type="bibr" rid="B10">DeMaria and Kaplan, 1994</xref>; <xref ref-type="bibr" rid="B11">DeMaria and Kaplan, 1999</xref>), and Statistical Typhoon Intensity Prediction Scheme (<xref ref-type="bibr" rid="B28">Knaff et&#xa0;al., 2005</xref>; <xref ref-type="bibr" rid="B26">Kim et&#xa0;al., 2018</xref>).</p>
<p>The MPI enables estimating the theoretical maximum intensity of TC given the atmospheric environment and ocean sea surface temperature (SST) (<xref ref-type="bibr" rid="B14">Emanuel, 1988</xref>; <xref ref-type="bibr" rid="B15">Emanuel, 1995</xref>). However, it often overestimates the maximum intensity of the TC because it does not consider TC-induced SST cooling. <xref ref-type="bibr" rid="B37">Lin et&#xa0;al. (2013)</xref> modified the MPI by using depth-averaged temperature (DAT) (<xref ref-type="bibr" rid="B46">Price, 2009</xref>) instead of SST and suggested the ocean coupling potential intensity (OC_PI). They demonstrated that OC_PI which reflects the ocean cooling effect by TC-induced vertical mixing can more realistically estimate the maximum intensity of TCs than MPI. Although the effects and importance of wind speed-dependent exchange coefficients on TCs have been demonstrated in several previous studies (<xref ref-type="bibr" rid="B45">Ooyama, 1969</xref>; <xref ref-type="bibr" rid="B13">Emanuel, 1986</xref>), the OC_PI still uses a default value of the enthalpy exchange coefficient (<italic>C<sub>k</sub>
</italic>) and drag coefficient (<italic>C<sub>d</sub>
</italic>). <xref ref-type="bibr" rid="B32">Lee et&#xa0;al. (2019)</xref> (hereafter LEE19) emphasized that changes in sea surface roughness due to wind significantly impact flux exchange at the air-sea interface. They revised the OC_PI by calculating a more realistic frictional dissipation, considering the&#xa0;wind-dependent <italic>C<sub>d</sub>
</italic>. This new predictor, called the Net Energy Gain Rate (<italic>NGR</italic>), improved the 24-hour TC intensity prediction by 16% and outperformed traditional POTs, which are generally considered the most reliable predictors in statistical-dynamical TC intensity models. <xref ref-type="bibr" rid="B25">Kim S. H. et&#xa0;al. (2022)</xref> explored the impact of a reduced <italic>C<sub>d</sub>
</italic> in high winds on TC intensity, specifically focusing on RI and lifetime maximum intensity. Utilizing the <italic>NGR</italic> as a key&#xa0;metric, the study delved into how each term of <italic>NGR</italic> is influenced by the decrease in <italic>C<sub>d</sub>
</italic>. They found that reduced <italic>C<sub>d</sub>
</italic> in high winds lessens frictional dissipation and limits sea surface cooling, leading to an increase in net energy that significantly influences TC intensification.</p>
<p>In this study, we propose a simple deterministic binary classification model based on five popular and widely used ML classifiers and ensemble methods to predict an RI event. Each model was trained and tested using the <italic>NGR</italic>, which considers wind-dependent <italic>C<sub>d</sub>
</italic> and ocean cooling effect by TC-induced vertical mixing in addition to the widely used predictors. A verification of each model is conducted using the confusion matrix. The results will be compared to the results of the latest studies based on a similar idea and finally show that RI prediction can be used to improve intensity forecasts.</p>
</sec>
<sec id="s2">
<label>2</label>
<title>Data and methods</title>
<sec id="s2_1">
<label>2.1</label>
<title>Data</title>
<p>For this research, we used the best track dataset for TCs in the WNP with wind speeds of 34 kt or higher. These data were provided by the Joint Typhoon Warning Center (JTWC) and span from 2004 to 2021. Oceanic variables, specifically SST and DAT, were computed using analysis/reanalysis data from the Hybrid Coordinate Ocean Model and the Navy Coupled Ocean Data Assimilation nowcast/forecast system (HYCOM+NCODA), as provided by the Naval Research Laboratory. DAT values were calculated at varying depths ranging from 10&#xa0;m to 120&#xa0;m, at 10&#xa0;m intervals (DAT<sub>10</sub> through DAT<sub>120</sub>). These values were used to compute various oceanic components such as MPI (MPI<sub>10</sub> to MPI<sub>120</sub>, henceforth referred to as MPIs), POT (POT<sub>10</sub> to POT<sub>120</sub>, henceforth referred to as POTs), OC_PI (OC_PI<sub>10</sub> to OC_PI<sub>120</sub>, henceforth referred to as OC_PIs), and <italic>NGR</italic> (NGR<sub>10</sub> to NGR<sub>120</sub>, henceforth referred to as <italic>NGRs</italic>). Atmospheric variables were obtained from the Global Forecast System (GFS) analysis, provided by the National Centers for Environmental Prediction (NCEP), with a spatial resolution of 1&#xb0; &#xd7; 1&#xb0; and a temporal resolution of 6 hours. The average radius of gale-force winds in the WNP is approximately 200&#xa0;km (<xref ref-type="bibr" rid="B24">Kim et&#xa0;al., 2022</xref>). <xref ref-type="bibr" rid="B55">Wang and Toumi (2021)</xref> have identified that the effective radius for TC-induced sea surface cooling is roughly of the same magnitude. To accurately capture the effects caused by a TC, we averaged both oceanic and atmospheric variables within a 200&#xa0;km radius of the TC center. Furthermore, to isolate and remove the influence of the TC from our data, we analyzed conditions from three days before the storm&#x2019;s arrival.</p>
</sec>
<sec id="s2_2">
<label>2.2</label>
<title>
<italic>NGR</italic> and the other predictors</title>
<p>
<italic>NGR</italic> is calculated as the difference between the rate of energy generation (G) and the rate of surface frictional dissipation (D), all within the context of Emanuel&#x2019;s MPI framework. <xref ref-type="bibr" rid="B24">Kim et&#xa0;al. (2022)</xref> showed that <italic>C<sub>d</sub>
</italic> is the most critical factor in determining the magnitude of <italic>NGR</italic>. This <italic>C<sub>d</sub>
</italic> not only significantly influences D but also plays an important role in vertical mixing within the ocean, which in turn affects the saturation enthalpy determined by SST. Therefore, using a more realistic <italic>C<sub>d</sub>
</italic> is crucial for comprehending the mechanisms of TC intensification. In this study, <italic>C<sub>d</sub>
</italic> parameterization from <xref ref-type="bibr" rid="B50">Soloviev et&#xa0;al. (2014)</xref>, based on two-phase parameterization and observations from previous studies, was used.</p>
<p>The <italic>NGR</italic> is computed using Emanuel&#x2019;s software package, with a modification: the SST in the original equation is replaced by DAT. Additionally, the model employs a wind-speed-dependent drag coefficient (<italic>C<sub>d</sub>
</italic>(V)) rather than using a constant drag coefficient.</p>
<p>The equations are as follows:</p>
<disp-formula id="eq1">
<mml:math display="block" id="M1">
<mml:mrow>
<mml:mi>N</mml:mi>
<mml:mi>G</mml:mi>
<mml:mi>R</mml:mi>
<mml:mo>=</mml:mo>
<mml:mi>G</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>D</mml:mi>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>D</mml:mi>
<mml:mi>A</mml:mi>
<mml:mi>T</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>T</mml:mi>
<mml:mi>o</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mi>T</mml:mi>
<mml:mi>o</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mfrac>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mi>k</mml:mi>
</mml:msub>
<mml:mi>&#x3c1;</mml:mi>
<mml:mi>V</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msubsup>
<mml:mi>k</mml:mi>
<mml:mi>o</mml:mi>
<mml:mo>*</mml:mo>
</mml:msubsup>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>k</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>C</mml:mi>
<mml:mi>d</mml:mi>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>V</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mi>&#x3c1;</mml:mi>
<mml:msup>
<mml:mi>V</mml:mi>
<mml:mn>3</mml:mn>
</mml:msup>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="eq2">
<mml:math display="block" id="M2">
<mml:mrow>
<mml:mi>D</mml:mi>
<mml:mi>A</mml:mi>
<mml:mi>T</mml:mi>
<mml:mo>&#xa0;</mml:mo>
<mml:mo>=</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mi>d</mml:mi>
</mml:mfrac>
<mml:munderover>
<mml:mo>&#x222b;</mml:mo>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>d</mml:mi>
</mml:mrow>
<mml:mn>0</mml:mn>
</mml:munderover>
<mml:mi>T</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mi>z</mml:mi>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mi>d</mml:mi>
<mml:mi>z</mml:mi>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where <italic>DAT</italic> is the depth-averaged temperature (<xref ref-type="bibr" rid="B46">Price, 2009</xref>), <italic>T</italic>
<sub>o</sub> represents the TC outflow temperature, <italic>C<sub>k</sub>
</italic> is the enthalpy exchange coefficient, &#x3c1; is the air density, <italic>k<sub>o</sub>
</italic>
<sup>*</sup> is the sea surface saturation enthalpy, <italic>k</italic> is the surface enthalpy in the TC environment, <italic>C<sub>d</sub>
</italic> is the drag coefficient, and <italic>V</italic> is the surface wind speed.</p>
<p>Higher <italic>NGR</italic> values suggest that more energy is available for TC intensification. Given its superior performance in predicting short-term TC intensification, <italic>NGR</italic> can be used as an ideal predictor for RI events. Its ability to more accurately capture the ocean&#x2019;s contribution to TC intensity changes within a 24-hour range makes it especially suitable for the RI events prediction.</p>
<p>The TC-induced vertical mixing depth is determined by various parameters such as the size, intensity, and translation speed of the TC, the Coriolis effect, and the vertical structure of the upper ocean. The depth of this mixing is crucial because it determines the SST where heat exchange occurs during the intensification of the TC. <xref ref-type="bibr" rid="B37">Lin et&#xa0;al. (2013)</xref> showed that using an average mixed layer depth of 80&#xa0;m minimizes the bias in the MPI for TCs of Saffir-Simpson Category 2 or higher. <xref ref-type="bibr" rid="B46">Price (2009)</xref> indicated that 0-100&#xa0;m DAT can adequately represent the mixing caused by major TCs. Meanwhile, LEE19 conducted a sensitivity analysis using the <italic>NGR</italic> for various depths of mixing and showed that fixing the depth at 50&#xa0;m yielded the highest predictive performance for changes in the intensity of the overall TCs. In this study, we took a comprehensive approach to account for the sensitivity of vertical mixing depth and to explore all possible combinations of predictors. We calculated all major predictors, including POT, <italic>NGR</italic>, and OC_PI, based on DATs. These calculations were done at 10-meter intervals up to a depth of 120 meters and were subsequently included in our predictor pool (<xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>).</p>
<table-wrap id="T1" position="float">
<label>Table&#xa0;1</label>
<caption>
<p>List of atmospheric and oceanic potential predictors used to build the machine learning-based RI prediction model.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="center">Predictor</th>
<th valign="top" align="left">Description</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="center">iWIND</td>
<td valign="top" align="left">Initial max wind speed</td>
</tr>
<tr>
<td valign="top" align="center">DVMX</td>
<td valign="top" align="left">Intensity change during previous 12 h</td>
</tr>
<tr>
<td valign="top" align="center">LON</td>
<td valign="top" align="left">Longitude</td>
</tr>
<tr>
<td valign="top" align="center">LAT</td>
<td valign="top" align="left">Latitude</td>
</tr>
<tr>
<td valign="top" align="center">MOV</td>
<td valign="top" align="left">TC translational speed</td>
</tr>
<tr>
<td valign="top" align="center">RHHI</td>
<td valign="top" align="left">Relative humidity at 500-300 hPa</td>
</tr>
<tr>
<td valign="top" align="center">RHLO</td>
<td valign="top" align="left">Relative humidity at 850-700 hPa</td>
</tr>
<tr>
<td valign="top" align="center">SH200</td>
<td valign="top" align="left">200-850 hPa vertical wind shear</td>
</tr>
<tr>
<td valign="top" align="center">SH500</td>
<td valign="top" align="left">500-850 hPa vertical wind shear</td>
</tr>
<tr>
<td valign="top" align="center">T200</td>
<td valign="top" align="left">Air temperature at 200 hPa</td>
</tr>
<tr>
<td valign="top" align="center">U200</td>
<td valign="top" align="left">Zonal wind at 200 hPa</td>
</tr>
<tr>
<td valign="top" align="center">RV850</td>
<td valign="top" align="left">Relative vorticity at 850 hPa</td>
</tr>
<tr>
<td valign="top" align="center">SST</td>
<td valign="top" align="left">Sea surface temperature</td>
</tr>
<tr>
<td valign="top" align="center">MPI</td>
<td valign="top" align="left">Maximum potential intensity</td>
</tr>
<tr>
<td valign="top" align="center">POT</td>
<td valign="top" align="left">MPI &#x2013; iWIND</td>
</tr>
<tr>
<td valign="top" align="center">OHC</td>
<td valign="top" align="left">Ocean heat content</td>
</tr>
<tr>
<td valign="top" align="center">DAT<italic>
<sub>d</sub>
</italic>
</td>
<td valign="top" align="left">Depth-averaged ocean temperature (<xref ref-type="bibr" rid="B46">Price, 2009</xref>), from 10-120&#xa0;m, 10&#xa0;m interval</td>
</tr>
<tr>
<td valign="top" align="center">OC_PI<italic>
<sub>d</sub>
</italic>
</td>
<td valign="top" align="left">DAT-based MPI (<xref ref-type="bibr" rid="B37">Lin et&#xa0;al., 2013</xref>)</td>
</tr>
<tr>
<td valign="top" align="center">POT<italic>
<sub>d</sub>
</italic>
</td>
<td valign="top" align="left">OC_PI-based POT</td>
</tr>
<tr>
<td valign="top" align="center">NGR<italic>
<sub>d</sub>
</italic>
</td>
<td valign="top" align="left">DAT-based net energy gain rate (<xref ref-type="bibr" rid="B32">Lee et&#xa0;al., 2019</xref>)</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Besides <italic>NGR</italic>, this study incorporates other well-established predictors commonly employed in statistical-dynamical models for TC intensity forecasting by various organizations (<xref ref-type="bibr" rid="B12">DeMaria et&#xa0;al., 2005</xref>; <xref ref-type="bibr" rid="B28">Knaff et&#xa0;al., 2005</xref>; <xref ref-type="bibr" rid="B26">Kim et&#xa0;al., 2018</xref>). In this study, we utilized a total of 65 potential predictors, encompassing a diverse range of factors. These include 5 static predictors, 7 atmospheric synoptic predictors, SST, MPI and the POT derived from it, OHC, and 49 predictors based on the DAT. All these predictors are summarized in <xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>. To evaluate the impact of <italic>NGR</italic> on the ML-based prediction of RI events, our study uses two distinct sets of these predictors. The first set consists of commonly used predictors related to TC intensity change, as identified in numerous statistical models (in <xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref>, excluding <italic>NGRs</italic>). The second set incorporates <italic>NGR</italic> into the first set in <xref ref-type="table" rid="T1">
<bold>Table&#xa0;1</bold>
</xref> (as illustrated in <xref ref-type="fig" rid="f1">
<bold>Figure&#xa0;1</bold>
</xref>).</p>
<fig id="f1" position="float">
<label>Figure&#xa0;1</label>
<caption>
<p>The flowchart of machine learning-based RI prediction model development. The dataset is divided into two parts: the training set and the testing set. The training set is used to build the machine learning classifiers, and the testing set is used to evaluate their performance. The ensemble classifier for RI prediction is also constructed and evaluated by using the hard-voting method.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-10-1296274-g001.tif"/>
</fig>
</sec>
<sec id="s2_3">
<label>2.3</label>
<title>Implementation of machine learning techniques</title>
<p>In this study, we employ a diverse ensemble of well-known classifiers to predict RI events in the WNP. The ensemble includes a Decision Tree (DT), Logistic Regression (LR), SVM, K-Nearest Neighbors (KNN), and Feed Forward Neural Network (FNN). DT serves as a comprehensive data-mining tool, which is adept at generating decision-making rules, identifying patterns, and uncovering knowledge embedded in archived databases (<xref ref-type="bibr" rid="B47">Quinlan, 1987</xref>). More specifically, the DT algorithm evaluates the conduciveness of environmental conditions for RI by systematically checking whether specific environmental predictors satisfy the thresholds set by the trained tree model. LR is used to predict a categorical variable such as the class label (<xref ref-type="bibr" rid="B54">Walker and Duncan, 1967</xref>). It is an extension of linear regression, where the classification problem is converted into a regression problem by estimating the log-odds of each class in place of the probability itself. The model uses the logistic function to squash the output of a linear equation between 0 and 1, making it interpretable as a probability. This method is prized for its simplicity, interpretability, and effectiveness in various domains. The SVM is designed to discover a hyperplane that best separates the data classes (<xref ref-type="bibr" rid="B8">Cortes and Vapnik, 1995</xref>). It achieves this by maximizing the margin between different classes in the feature space. The KNN algorithm makes predictions by storing all training data and identifying the classes of the k closest neighbors to each test sample (<xref ref-type="bibr" rid="B23">Keller et&#xa0;al., 1985</xref>). It aims to classify an unknown sample based on the known classifications of its nearest neighbors. Finally, FNN is a straightforward artificial neural network composed of an input layer and an output layer. 
The flow of crucial input information in FNN moves strictly from its input layer to its output layer, making the model especially well-suited for parameter identification tasks (<xref ref-type="bibr" rid="B61">Zhang et&#xa0;al., 2022</xref>). Each of these classifiers brings its own set of strengths to the ensemble, contributing to a more robust and reliable RI prediction for the WNP.</p>
<p>To enhance predictability, we employ a hard-voting ensemble method that combines the predictions of the individual classifiers. In this approach, each classifier &#x2018;votes&#x2019; for a class when presented with a test instance. The ensemble then selects the class that receives the majority of votes as its final prediction. By employing this hard-voting scheme, we aim to benefit from the complementary strengths of each classifier, thereby achieving a more robust and accurate model for predicting RI events in the WNP. Given that RI events are not commonly observed, as shown in <xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>, there is a clear class imbalance in our dataset. To effectively address and rectify this imbalance, we made use of the Synthetic Minority Over-sampling Technique, commonly known as SMOTE (<xref ref-type="bibr" rid="B5">Chawla et&#xa0;al., 2011</xref>). This method effectively tackles the issue of class imbalance in datasets, which is critical in many ML applications. Generating synthetic data for the minority class and creating new data points between existing ones helps balance the dataset. This balance is crucial for training unbiased models and ensuring they effectively learn the characteristics of all classes. This approach ultimately leads to an enhancement in the overall accuracy and performance of the model, making it more reliable for real-world applications. In this study, Principal Component Analysis (PCA) was applied to the pool of predictors to combat multicollinearity within the model. The integration of PCA into our ML-based classification model brought several advantages. It effectively streamlined the dataset by reducing dimensionality, which helped mitigate issues related to the curse of dimensionality and overfitting. This feature reduction also led to improved computational efficiency. Additionally, by focusing on the primary directions of data variance, PCA successfully filtered out noise and irrelevant information, resulting in a more refined dataset (<xref ref-type="bibr" rid="B53">Tefas and Pitas, 2016</xref>). Notably, we only used those principal components that represented at least 99% of the cumulative explained variance as predictors in our model. Given the limited size of our dataset, we employed a 10-fold cross-validation approach, ensuring the selection of the most effective models and preventing overfitting during training. The dataset from 2004 to 2018 was designated for training, while data from 2019 to 2021 was reserved for testing. Within the training data, there were 627 RI cases and 3,388 non-RI cases. 
Meanwhile, the testing dataset comprised 103 RI cases and 581 non-RI cases, as detailed in <xref ref-type="table" rid="T2">
<bold>Table&#xa0;2</bold>
</xref>.</p>
<table-wrap id="T2" position="float">
<label>Table&#xa0;2</label>
<caption>
<p>The comparison of the number of RI and non-RI cases for the training (2004&#x2013;2018) and test (2019&#x2013;2021) periods in the western North Pacific.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center"/>
<th valign="middle" align="center">Number of RI cases</th>
<th valign="middle" align="center">Number of non-RI cases</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">Training period<break/>(2004&#x2013;2018)</td>
<td valign="middle" align="center">627</td>
<td valign="middle" align="center">3388</td>
</tr>
<tr>
<td valign="middle" align="center">Test period<break/>(2019&#x2013;2021)</td>
<td valign="middle" align="center">103</td>
<td valign="middle" align="center">581</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s2_4">
<label>2.4</label>
<title>Evaluating metrics</title>
<p>In the realm of binary classification models, the evaluation of predictor significance is pivotal for model accuracy and interpretability. Among various statistical measures, Cohen&#x2019;s d is an effective tool for quantifying the discriminative power of predictors. Originally designed to measure the standardized difference between two means in psychological research, Cohen&#x2019;s d can be adapted to assess how individual predictors differentiate between the two classes of the model, typically labeled positive and negative. By calculating the difference in means of a predictor for each class and dividing it by the pooled standard deviation, Cohen&#x2019;s d provides a standardized effect size, facilitating direct and quantifiable comparison of the predictor&#x2019;s impact across different models and datasets. Cohen&#x2019;s d is calculated as:</p>
<disp-formula id="eq3">
<mml:math display="block" id="M3">
<mml:mrow>
<mml:mi>d</mml:mi>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mi>M</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:mi>S</mml:mi>
<mml:msub>
<mml:mi>D</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>l</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>d</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where M<sub>1</sub> and M<sub>2</sub> are the means of the predictor values for each of the two classes. <italic>SD<sub>pooled</sub>
</italic> is the pooled standard deviation of the predictor values across both classes. It is computed as:</p>
<disp-formula id="eq4">
<mml:math display="block" id="M4">
<mml:mrow>
<mml:mi>S</mml:mi>
<mml:msub>
<mml:mi>D</mml:mi>
<mml:mrow>
<mml:mi>p</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>l</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>d</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:msqrt>
<mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>S</mml:mi>
<mml:msubsup>
<mml:mi>D</mml:mi>
<mml:mn>1</mml:mn>
<mml:mn>2</mml:mn>
</mml:msubsup>
<mml:mo>&#xd7;</mml:mo>
<mml:msub>
<mml:mi>n</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>+</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>S</mml:mi>
<mml:msubsup>
<mml:mi>D</mml:mi>
<mml:mn>2</mml:mn>
<mml:mn>2</mml:mn>
</mml:msubsup>
<mml:mo>&#xd7;</mml:mo>
<mml:msub>
<mml:mi>n</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mi>n</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mi>n</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:msqrt>
</mml:mrow>
</mml:math>
</disp-formula>
<p>where <italic>SD<sub>1</sub>
</italic> and <italic>SD<sub>2</sub>
</italic> are the standard deviations for each class, and <italic>n<sub>1</sub>
</italic> and <italic>n<sub>2</sub>
</italic> are the sample sizes. A higher Cohen&#x2019;s d value indicates greater separation between the classes based on the predictor, signifying its importance in the classification task. Typically, Cohen&#x2019;s d values around 0.2 are considered small, around 0.5 medium, and 0.8 or higher, large. This gradation helps in pinpointing the predictors with the most significant roles in distinguishing between classes.</p>
<p>In binary forecasts where models predict an RI event or non-RI event for a training and test set, evaluation metrics comprise elements from a confusion matrix that compare observations to model forecasts (<xref ref-type="table" rid="T3">
<bold>Table&#xa0;3</bold>
</xref>). True Positive (<italic>TP</italic>) is the number of correct forecasts of RI events, whereas False Positive (<italic>FP</italic>) is the number of cases where the model forecast RI but RI was not observed. False Negative (<italic>FN</italic>) is the number of cases where the model did not forecast RI, but RI was observed. True Negative (<italic>TN</italic>) is the number of cases where the model did not forecast RI and RI was not observed.</p>
<table-wrap id="T3" position="float">
<label>Table&#xa0;3</label>
<caption>
<p>Confusion matrix for a binary RI and non-RI classifier.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" rowspan="2" colspan="2" align="center"/>
<th valign="middle" colspan="2" align="center">Observation</th>
</tr>
<tr>
<th valign="middle" align="center">RI</th>
<th valign="middle" align="center">Non-RI</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" rowspan="2" align="center">Forecast</td>
<td valign="middle" align="center">RI</td>
<td valign="middle" align="center">Hits<break/>
<italic>TP</italic>
</td>
<td valign="middle" align="center">False alarms<break/>
<italic>FP</italic>
</td>
</tr>
<tr>
<td valign="middle" align="center">Non-RI</td>
<td valign="middle" align="center">Misses<break/>
<italic>FN</italic>
</td>
<td valign="middle" align="center">Correct rejects<break/>
<italic>TN</italic>
</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Accuracy (ACC) is used to measure the overall performance of a binary classifier and is measured as</p>
<disp-formula id="eq5">
<mml:math display="block" id="M5">
<mml:mrow>
<mml:mi>A</mml:mi>
<mml:mi>C</mml:mi>
<mml:mi>C</mml:mi>
<mml:mo>=</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>T</mml:mi>
<mml:mi>N</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>F</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>T</mml:mi>
<mml:mi>N</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>F</mml:mi>
<mml:mi>N</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>The false alarm ratio (FAR) is the number of incorrect forecasts of RI divided by the total number of RI forecasts. FAR is calculated as</p>
<disp-formula id="eq6">
<mml:math display="block" id="M6">
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mi>A</mml:mi>
<mml:mi>R</mml:mi>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mi>P</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>F</mml:mi>
<mml:mi>P</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>The probability of detection (POD) is the ratio of the correct forecasts of RI occurrences to the actual number of RI occurrences and is calculated as</p>
<disp-formula id="eq7">
<mml:math display="block" id="M7">
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mi>O</mml:mi>
<mml:mi>D</mml:mi>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>F</mml:mi>
<mml:mi>N</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>Precision measures the accuracy of positive predictions in classification problems. It&#x2019;s the ratio of the correct forecasts of RI occurrences to the total number of positive predictions (which includes both <italic>TP</italic> and <italic>FP</italic>). Precision is calculated as</p>
<disp-formula id="eq8">
<mml:math display="block" id="M8">
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>s</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>n</mml:mi>
<mml:mo>=</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>F</mml:mi>
<mml:mi>P</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>The Peirce skill score (PSS), also known as the Hanssen-Kuipers skill score, measures skill relative to an unbiased random reference forecast and is calculated as</p>
<disp-formula id="eq9">
<mml:math display="block" id="M9">
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mi>S</mml:mi>
<mml:mi>S</mml:mi>
<mml:mo>=</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>T</mml:mi>
<mml:mi>N</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>F</mml:mi>
<mml:mi>N</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>T</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>F</mml:mi>
<mml:mi>N</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#xd7;</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mi>P</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>T</mml:mi>
<mml:mi>N</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>The F-1 score is a way of combining the precision and POD of the model, and it is defined as the harmonic mean of the model&#x2019;s precision and POD. The F-1 score is calculated as</p>
<disp-formula id="eq10">
<mml:math display="block" id="M10">
<mml:mrow>
<mml:mi>F</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo>&#xa0;</mml:mo>
<mml:mi>s</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>2</mml:mn>
<mml:mo>&#xd7;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mi>O</mml:mi>
<mml:mi>D</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>P</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>s</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>P</mml:mi>
<mml:mi>O</mml:mi>
<mml:mi>D</mml:mi>
<mml:mo>+</mml:mo>
<mml:mi>P</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>s</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
<p>A perfect forecast model would achieve an ACC, POD, and PSS score of 1 and a FAR score of 0. In general, higher values of ACC, POD, Precision, PSS and F-1 score, coupled with a lower FAR, indicate superior model performance.</p>
</sec>
</sec>
<sec id="s3" sec-type="results">
<label>3</label>
<title>Results</title>
<sec id="s3_1">
<label>3.1</label>
<title>Characterization of individual predictors</title>
<p>In this section, we examine the classification performance of potential predictors for RI events before developing a classification model. The mean distribution for RI and non-RI classes for each predictor, the effect size of the mean differences between these classes, and the correlation coefficients with the 24-hour intensity change were analyzed (<xref ref-type="table" rid="T4">
<bold>Table&#xa0;4</bold>
</xref>; <xref ref-type="fig" rid="f2">
<bold>Figures&#xa0;2</bold>
</xref>, <xref ref-type="fig" rid="f3">
<bold>3</bold>
</xref>). Excluding DAT-based predictors, the ocean temperature and MPI theory-based predictors (SST, MPI, POT, OHC) exhibited the highest Cohen&#x2019;s d and correlation coefficients. Following these, static predictors such as DVMX and LAT displayed the next highest values of Cohen&#x2019;s d. Synoptic predictors, apart from wind shear-related predictors (SH200, SH500, U200), generally demonstrated lower predictive performance.</p>
<table-wrap id="T4" position="float">
<label>Table&#xa0;4</label>
<caption>
<p>Mean distribution of potential predictors for RI and non-RI events, <italic>p-value</italic> (Student&#x2019;s <italic>t-test</italic>) and <italic>Cohen&#x2019;s d</italic> of the difference between the two groups.</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="top" align="center">Predictor</th>
<th valign="top" align="center">unit</th>
<th valign="top" align="center">RI</th>
<th valign="top" align="center">non-RI</th>
<th valign="top" align="center">
<italic>p-value</italic>
</th>
<th valign="top" align="center">
<italic>Cohen&#x2019;s d</italic>
</th>
<th valign="top" align="center">
<italic>R</italic>
</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="center">iWIND</td>
<td valign="top" align="center">kt</td>
<td valign="top" align="center">65.9 &#xb1; 21.0</td>
<td valign="top" align="center">73.2 &#xb1; 33.2</td>
<td valign="top" align="center">&lt; 0.001</td>
<td valign="top" align="center">-0.23</td>
<td valign="top" align="center">-0.39</td>
</tr>
<tr>
<td valign="top" align="center">DVMX</td>
<td valign="top" align="center">kt</td>
<td valign="top" align="center">11.1 &#xb1; 9.5</td>
<td valign="top" align="center">3.1 &#xb1; 11.4</td>
<td valign="top" align="center">&lt; 0.001</td>
<td valign="top" align="center">
<bold>0.72</bold>
</td>
<td valign="top" align="center">0.36</td>
</tr>
<tr>
<td valign="top" align="center">LON</td>
<td valign="top" align="center">&#xb0;</td>
<td valign="top" align="center">137.0 &#xb1; 10.0</td>
<td valign="top" align="center">136.3 &#xb1; 12.2</td>
<td valign="top" align="center">0.16</td>
<td valign="top" align="center">0.06</td>
<td valign="top" align="center">0.01</td>
</tr>
<tr>
<td valign="top" align="center">LAT</td>
<td valign="top" align="center">&#xb0;</td>
<td valign="top" align="center">16.8 &#xb1; 4.6</td>
<td valign="top" align="center">20.9 &#xb1; 6.8</td>
<td valign="top" align="center">&lt; 0.001</td>
<td valign="top" align="center">
<bold>-0.62</bold>
</td>
<td valign="top" align="center">-0.36</td>
</tr>
<tr>
<td valign="top" align="center">MOV</td>
<td valign="top" align="center">m s<sup>-1</sup>
</td>
<td valign="top" align="center">5.1 &#xb1; 2.0</td>
<td valign="top" align="center">5.3 &#xb1; 3.1</td>
<td valign="top" align="center">0.11</td>
<td valign="top" align="center">-0.06</td>
<td valign="top" align="center">-0.12</td>
</tr>
<tr>
<td valign="top" align="center">RHHI</td>
<td valign="top" align="center">%</td>
<td valign="top" align="center">54.1 &#xb1; 14.0</td>
<td valign="top" align="center">50.2 &#xb1; 14.9</td>
<td valign="top" align="center">&lt; 0.001</td>
<td valign="top" align="center">0.26</td>
<td valign="top" align="center">0.17</td>
</tr>
<tr>
<td valign="top" align="center">RHLO</td>
<td valign="top" align="center">%</td>
<td valign="top" align="center">71.2 &#xb1; 7.2</td>
<td valign="top" align="center">68.8 &#xb1; 8.7</td>
<td valign="top" align="center">&lt; 0.001</td>
<td valign="top" align="center">0.28</td>
<td valign="top" align="center">0.18</td>
</tr>
<tr>
<td valign="top" align="center">SH200</td>
<td valign="top" align="center">m s<sup>-1</sup>
</td>
<td valign="top" align="center">13.5 &#xb1; 4.0</td>
<td valign="top" align="center">15.9 &#xb1; 5.8</td>
<td valign="top" align="center">&lt; 0.001</td>
<td valign="top" align="center">-0.43</td>
<td valign="top" align="center">-0.36</td>
</tr>
<tr>
<td valign="top" align="center">SH500</td>
<td valign="top" align="center">m s<sup>-1</sup>
</td>
<td valign="top" align="center">5.5 &#xb1; 2.0</td>
<td valign="top" align="center">6.7 &#xb1; 2.7</td>
<td valign="top" align="center">&lt; 0.001</td>
<td valign="top" align="center">-0.45</td>
<td valign="top" align="center">-0.36</td>
</tr>
<tr>
<td valign="top" align="center">T200</td>
<td valign="top" align="center">K</td>
<td valign="top" align="center">221.3 &#xb1; 1.1</td>
<td valign="top" align="center">221.7 &#xb1; 1.3</td>
<td valign="top" align="center">&lt; 0.001</td>
<td valign="top" align="center">-0.29</td>
<td valign="top" align="center">-0.13</td>
</tr>
<tr>
<td valign="top" align="center">U200</td>
<td valign="top" align="center">m s<sup>-1</sup>
</td>
<td valign="top" align="center">-2.7 &#xb1; 5.9</td>
<td valign="top" align="center">1.3 &#xb1; 9.4</td>
<td valign="top" align="center">&lt; 0.001</td>
<td valign="top" align="center">-0.45</td>
<td valign="top" align="center">-0.39</td>
</tr>
<tr>
<td valign="top" align="center">RV850</td>
<td valign="top" align="center">10<sup>-6</sup> s<sup>-1</sup>
</td>
<td valign="top" align="center">3.5 &#xb1; 5.9</td>
<td valign="top" align="center">2.7 &#xb1; 6.8</td>
<td valign="top" align="center">0.003</td>
<td valign="top" align="center">0.12</td>
<td valign="top" align="center">0.13</td>
</tr>
<tr>
<td valign="top" align="center">SST</td>
<td valign="top" align="center">&#xb0;C</td>
<td valign="top" align="center">29.2 &#xb1; 0.7</td>
<td valign="top" align="center">28.4 &#xb1; 1.4</td>
<td valign="top" align="center">&lt; 0.001</td>
<td valign="top" align="center">
<bold>0.60</bold>
</td>
<td valign="top" align="center">0.45</td>
</tr>
<tr>
<td valign="top" align="center">MPI</td>
<td valign="top" align="center">kt</td>
<td valign="top" align="center">178.8 &#xb1; 15.8</td>
<td valign="top" align="center">159.6 &#xb1; 32.2</td>
<td valign="top" align="center">&lt; 0.001</td>
<td valign="top" align="center">
<bold>0.76</bold>
</td>
<td valign="top" align="center">0.46</td>
</tr>
<tr>
<td valign="top" align="center">POT</td>
<td valign="top" align="center">kt</td>
<td valign="top" align="center">112.9 &#xb1; 27.6</td>
<td valign="top" align="center">86.4 &#xb1; 46.3</td>
<td valign="top" align="center">&lt; 0.001</td>
<td valign="top" align="center">
<bold>0.61</bold>
</td>
<td valign="top" align="center">0.60</td>
</tr>
<tr>
<td valign="top" align="center">OHC</td>
<td valign="top" align="center">kJ cm<sup>-2</sup>
</td>
<td valign="top" align="center">78.2 &#xb1; 27.2</td>
<td valign="top" align="center">53.9 &#xb1; 32.8</td>
<td valign="top" align="center">&lt; 0.001</td>
<td valign="top" align="center">
<bold>0.62</bold>
</td>
<td valign="top" align="center">0.41</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>The correlation coefficient indicates the relationship between the predictor and the 24-hour intensity change. Absolute values of Cohen&#x2019;s d greater than 0.5 (medium or greater) are indicated in bold.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<fig id="f2" position="float">
<label>Figure&#xa0;2</label>
<caption>
<p>The comparison of the mean distribution of each class for <bold>(A)</bold> <italic>DAT<sub>d</sub>
</italic>, <bold>(B)</bold> <italic>OC_PI<sub>d</sub>
</italic>, <bold>(C)</bold> <italic>POT<sub>d</sub>
</italic> and <bold>(D)</bold> <italic>NGR<sub>d</sub></italic>. The predictors are based on the computed average ocean temperature from the surface down to a depth of 120 meters (in 10-meter intervals) over the period 2004&#x2013;2021. The red (black) solid line and shade indicate the mean value and &#xb1;1 &#x3c3; range of RI (non-RI) class, respectively. Cohen&#x2019;s d values (blue line) show the effect size of mean differences between RI and non-RI classes.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-10-1296274-g002.tif"/>
</fig>
<fig id="f3" position="float">
<label>Figure&#xa0;3</label>
<caption>
<p>The comparison of the correlation coefficients between depth-averaged temperature-based predictors and 24-hour intensity change. The predictors are based on the computed average ocean temperature from the surface down to a depth of 120 meters (in 10-meter intervals) over the period 2004&#x2013;2021. Pentagrams represent the location of the maximum correlation coefficient for each group.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-10-1296274-g003.tif"/>
</fig>
<p>DAT-based predictors demonstrated higher Cohen&#x2019;s d values compared to those derived from traditional SST (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2</bold>
</xref>). For DAT-based predictors, excluding <italic>NGR<sub>d</sub>
</italic>, Cohen&#x2019;s d between the two classes increased progressively with greater mixing depths, peaking at depths of 100-110 meters. <italic>NGR<sub>d</sub>
</italic>, in contrast, displayed a steadily increasing Cohen&#x2019;s d value with depth, reaching a peak at 60 meters and demonstrating a higher Cohen&#x2019;s d value that overshadowed the other potential predictors. <xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref> illustrates distinct patterns of correlation for each predictor as a function of mixing depth, indicating that the relationship between predictors and TC intensity change is sensitive to the mixing depth. Notably, <italic>NGR<sub>d</sub>
</italic> emerges as a superior predictor, with its maximum correlation coefficient occurring at a mixing depth of 60 meters (<xref ref-type="fig" rid="f3">
<bold>Figure&#xa0;3</bold>
</xref>, red line). This is not only higher than those of other predictors but also aligns with the depth where Cohen&#x2019;s d&#x2014;a statistical measure of effect size&#x2014;reaches its peak (<xref ref-type="fig" rid="f2">
<bold>Figure&#xa0;2D</bold>
</xref>, blue line). The consistency of the <italic>NGR<sub>d</sub>
</italic> peak with the maximum of Cohen&#x2019;s d at 60 meters suggests a strong and possibly causal relationship between DATs of this depth and TC intensification rates, as well as RI events. This underscores the value of <italic>NGR<sub>d</sub>
</italic>, based on 60-meter DAT, as a potentially powerful single predictor for anticipating changes in TC intensity, which is crucial for early warning systems and preparedness measures in vulnerable coastal regions.</p>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Assessment of model predictive performance</title>
<p>As outlined in <xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4</bold>
</xref> and <xref ref-type="table" rid="T5">
<bold>Table&#xa0;5</bold>
</xref>, our study includes a comprehensive summary of the performance metrics &#x2014; POD, PSS, FAR, Precision, ACC, and F-1 score &#x2014; for individual ML models. These were evaluated during the training period running from 2004 to 2018. A modest change emerged when we incorporated <italic>NGRs</italic> into the predictor pools: the metrics of POD, Precision, PSS, F-1 score and ACC generally increased across the models, while the FAR metric correspondingly decreased. The only exception to this was observed in the DT model. This underscores the relevance and value of incorporating <italic>NGRs</italic> into the feature set, as models with <italic>NGRs</italic> consistently outperformed those without. Individually, the <italic>NGR</italic>-based FNN exhibited the highest predictive performance overall, closely followed by the SVM model.</p>
<fig id="f4" position="float">
<label>Figure&#xa0;4</label>
<caption>
<p>Binary confusion metrics of the developed models during the training period: <bold>(A)</bold> DT, <bold>(B)</bold> LR, <bold>(C)</bold> SVM, <bold>(D)</bold> KNN, <bold>(E)</bold> FNN, and <bold>(F)</bold> hard voting ensemble (ENS) of the above models. The red indicates the NGR-based model&#x2019;s outcomes, while the blue shows the performance of the non-NGR model.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-10-1296274-g004.tif"/>
</fig>
<table-wrap id="T5" position="float">
<label>Table&#xa0;5</label>
<caption>
<p>Performance metrics for the individual model and ensemble with <italic>NGR</italic>-based predictors and without <italic>NGR</italic>-based predictors for the training period (2004&#x2013;2018).</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">Model</th>
<th valign="middle" align="center"/>
<th valign="middle" align="center">POD</th>
<th valign="middle" align="center">FAR</th>
<th valign="top" align="center">Precision</th>
<th valign="middle" align="center">PSS</th>
<th valign="top" align="center">F-1 score</th>
<th valign="middle" align="center">ACC</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" rowspan="2" align="center">DT</td>
<td valign="middle" align="center">w/o</td>
<td valign="middle" align="center">0.90</td>
<td valign="middle" align="center">0.23</td>
<td valign="top" align="center">0.77</td>
<td valign="middle" align="center">0.63</td>
<td valign="top" align="center">0.83</td>
<td valign="middle" align="center">81.7%</td>
</tr>
<tr>
<td valign="middle" align="center">with</td>
<td valign="middle" align="center">0.83</td>
<td valign="middle" align="center">0.20</td>
<td valign="top" align="center">0.80</td>
<td valign="middle" align="center">0.62</td>
<td valign="top" align="center">0.81</td>
<td valign="middle" align="center">81.0%</td>
</tr>
<tr>
<td valign="middle" rowspan="2" align="center">LR</td>
<td valign="middle" align="center">w/o</td>
<td valign="middle" align="center">0.84</td>
<td valign="middle" align="center">0.29</td>
<td valign="top" align="center">0.71</td>
<td valign="middle" align="center">0.50</td>
<td valign="top" align="center">0.77</td>
<td valign="middle" align="center">74.9%</td>
</tr>
<tr>
<td valign="middle" align="center">with</td>
<td valign="middle" align="center">0.82</td>
<td valign="middle" align="center">0.24</td>
<td valign="top" align="center">0.76</td>
<td valign="middle" align="center">0.56</td>
<td valign="top" align="center">0.79</td>
<td valign="middle" align="center">78.1%</td>
</tr>
<tr>
<td valign="middle" rowspan="2" align="center">SVM</td>
<td valign="middle" align="center">w/o</td>
<td valign="middle" align="center">0.88</td>
<td valign="middle" align="center">0.21</td>
<td valign="top" align="center">0.79</td>
<td valign="middle" align="center">0.64</td>
<td valign="top" align="center">0.83</td>
<td valign="middle" align="center">82.2%</td>
</tr>
<tr>
<td valign="middle" align="center">with</td>
<td valign="middle" align="center">0.89</td>
<td valign="middle" align="center">0.21</td>
<td valign="top" align="center">0.79</td>
<td valign="middle" align="center">0.66</td>
<td valign="top" align="center">0.84</td>
<td valign="middle" align="center">83.0%</td>
</tr>
<tr>
<td valign="middle" rowspan="2" align="center">KNN</td>
<td valign="middle" align="center">w/o</td>
<td valign="middle" align="center">0.94</td>
<td valign="middle" align="center">0.30</td>
<td valign="top" align="center">0.70</td>
<td valign="middle" align="center">0.53</td>
<td valign="top" align="center">0.80</td>
<td valign="middle" align="center">76.5%</td>
</tr>
<tr>
<td valign="middle" align="center">with</td>
<td valign="middle" align="center">0.94</td>
<td valign="middle" align="center">0.29</td>
<td valign="top" align="center">0.71</td>
<td valign="middle" align="center">0.56</td>
<td valign="top" align="center">0.81</td>
<td valign="middle" align="center">77.9%</td>
</tr>
<tr>
<td valign="middle" rowspan="2" align="center">FNN</td>
<td valign="middle" align="center">w/o</td>
<td valign="middle" align="center">0.88</td>
<td valign="middle" align="center">0.17</td>
<td valign="middle" align="center">0.83</td>
<td valign="middle" align="center">0.69</td>
<td valign="middle" align="center">0.85</td>
<td valign="middle" align="center">84.5%</td>
</tr>
<tr>
<td valign="middle" align="center">with</td>
<td valign="middle" align="center">0.90</td>
<td valign="middle" align="center">0.16</td>
<td valign="top" align="center">0.84</td>
<td valign="middle" align="center">0.73</td>
<td valign="top" align="center">0.87</td>
<td valign="middle" align="center">86.7%</td>
</tr>
<tr>
<td valign="middle" rowspan="2" align="center">Ensemble<break/>(hard voting)</td>
<td valign="middle" align="center">w/o</td>
<td valign="middle" align="center">0.90</td>
<td valign="middle" align="center">0.21</td>
<td valign="top" align="center">0.79</td>
<td valign="middle" align="center">0.66</td>
<td valign="top" align="center">0.84</td>
<td valign="middle" align="center">82.8%</td>
</tr>
<tr>
<td valign="middle" align="center">with</td>
<td valign="middle" align="center">0.93</td>
<td valign="middle" align="center">0.22</td>
<td valign="top" align="center">0.78</td>
<td valign="middle" align="center">0.67</td>
<td valign="top" align="center">0.85</td>
<td valign="middle" align="center">83.6%</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>During the test period of 2019 to 2021, summarized in <xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5</bold>
</xref> and <xref ref-type="table" rid="T6">
<bold>Table&#xa0;6</bold>
</xref>, the favorable impact of <italic>NGRs</italic> was further corroborated. <italic>NGR</italic>-based models once again outperformed their counterparts that lacked this feature. This improvement is related to an increase in the number of TN samples: <italic>NGR</italic>-based models detected non-RI cases relatively better (<xref ref-type="fig" rid="f5">
<bold>Figure&#xa0;5</bold>
</xref>). Among the individual models, the <italic>NGR</italic>-based SVM emerged as the best performer, particularly in terms of PSS. The consistency of this impact across both training and test periods reaffirms the generalizability and reliability of our methodological approach. An interesting point of divergence between the training and test periods was in the performance indicators. In addressing the class imbalance, oversampling was applied during the training phase. However, this method artificially inflates the TP count. The notable increase in POD and a corresponding decrease in FAR during the training period is attributable to the oversampling technique employed. Because oversampling is not performed in the testing phase, the ratio of RI cases decreases significantly compared to the training phase. This results in a relatively large decrease in TP, which in turn inflates FAR. This highlights the distortion in model performance metrics due to the uneven application of oversampling across training and testing datasets.</p>
<fig id="f5" position="float">
<label>Figure&#xa0;5</label>
<caption>
<p>Same as <xref ref-type="fig" rid="f4">
<bold>Figure&#xa0;4</bold>
</xref>, but for test period.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-10-1296274-g005.tif"/>
</fig>
<table-wrap id="T6" position="float">
<label>Table&#xa0;6</label>
<caption>
<p>Same as <xref ref-type="table" rid="T5"><bold>Table&#xa0;5</bold></xref>, but for the test period (2019&#x2013;2021).</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">Model</th>
<th valign="middle" align="center"/>
<th valign="middle" align="center">POD</th>
<th valign="middle" align="center">FAR</th>
<th valign="top" align="center">Precision</th>
<th valign="middle" align="center">PSS</th>
<th valign="top" align="center">F-1 score</th>
<th valign="middle" align="center">ACC</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" rowspan="2" align="center">DT</td>
<td valign="middle" align="center">w/o</td>
<td valign="middle" align="center">0.72</td>
<td valign="middle" align="center">0.71</td>
<td valign="top" align="center">0.29</td>
<td valign="middle" align="center">0.40</td>
<td valign="top" align="center">0.41</td>
<td valign="middle" align="center">68.7%</td>
</tr>
<tr>
<td valign="middle" align="center">with</td>
<td valign="middle" align="center">0.77</td>
<td valign="middle" align="center">0.66</td>
<td valign="top" align="center">0.34</td>
<td valign="middle" align="center">0.50</td>
<td valign="top" align="center">0.47</td>
<td valign="middle" align="center">74.1%</td>
</tr>
<tr>
<td valign="middle" rowspan="2" align="center">LR</td>
<td valign="middle" align="center">w/o</td>
<td valign="middle" align="center">0.83</td>
<td valign="middle" align="center">0.72</td>
<td valign="top" align="center">0.28</td>
<td valign="middle" align="center">0.44</td>
<td valign="top" align="center">0.42</td>
<td valign="middle" align="center">65.1%</td>
</tr>
<tr>
<td valign="middle" align="center">with</td>
<td valign="middle" align="center">0.80</td>
<td valign="middle" align="center">0.66</td>
<td valign="top" align="center">0.34</td>
<td valign="middle" align="center">0.52</td>
<td valign="top" align="center">0.47</td>
<td valign="middle" align="center">73.4%</td>
</tr>
<tr>
<td valign="middle" rowspan="2" align="center">SVM</td>
<td valign="middle" align="center">w/o</td>
<td valign="middle" align="center">0.73</td>
<td valign="middle" align="center">0.62</td>
<td valign="top" align="center">0.38</td>
<td valign="middle" align="center">0.51</td>
<td valign="top" align="center">0.50</td>
<td valign="middle" align="center">77.8%</td>
</tr>
<tr>
<td valign="middle" align="center">with</td>
<td valign="middle" align="center">0.76</td>
<td valign="middle" align="center">0.61</td>
<td valign="top" align="center">0.39</td>
<td valign="middle" align="center">0.55</td>
<td valign="top" align="center">0.51</td>
<td valign="middle" align="center">78.4%</td>
</tr>
<tr>
<td valign="middle" rowspan="2" align="center">KNN</td>
<td valign="middle" align="center">w/o</td>
<td valign="middle" align="center">0.90</td>
<td valign="middle" align="center">0.71</td>
<td valign="top" align="center">0.29</td>
<td valign="middle" align="center">0.52</td>
<td valign="top" align="center">0.44</td>
<td valign="middle" align="center">65.6%</td>
</tr>
<tr>
<td valign="middle" align="center">with</td>
<td valign="middle" align="center">0.87</td>
<td valign="middle" align="center">0.70</td>
<td valign="top" align="center">0.30</td>
<td valign="middle" align="center">0.51</td>
<td valign="top" align="center">0.45</td>
<td valign="middle" align="center">67.5%</td>
</tr>
<tr>
<td valign="middle" rowspan="2" align="center">FNN</td>
<td valign="middle" align="center">w/o</td>
<td valign="middle" align="center">0.64</td>
<td valign="middle" align="center">0.65</td>
<td valign="top" align="center">0.35</td>
<td valign="middle" align="center">0.43</td>
<td valign="top" align="center">0.46</td>
<td valign="middle" align="center">76.9%</td>
</tr>
<tr>
<td valign="middle" align="center">with</td>
<td valign="middle" align="center">0.70</td>
<td valign="middle" align="center">0.61</td>
<td valign="top" align="center">0.39</td>
<td valign="middle" align="center">0.51</td>
<td valign="top" align="center">0.50</td>
<td valign="middle" align="center">79.2%</td>
</tr>
<tr>
<td valign="middle" rowspan="2" align="center">Ensemble<break/>(hard voting)</td>
<td valign="middle" align="center">w/o</td>
<td valign="middle" align="center">0.79</td>
<td valign="middle" align="center">0.67</td>
<td valign="top" align="center">0.33</td>
<td valign="middle" align="center">0.51</td>
<td valign="top" align="center">0.47</td>
<td valign="middle" align="center">73.1%</td>
</tr>
<tr>
<td valign="middle" align="center">with</td>
<td valign="middle" align="center">0.79</td>
<td valign="middle" align="center">0.62</td>
<td valign="top" align="center">0.38</td>
<td valign="middle" align="center">0.56</td>
<td valign="top" align="center">0.51</td>
<td valign="middle" align="center">77.6%</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>To generate an ensemble forecast, we employ a hard-voting method based on the collective performance metrics of five distinct classifiers. Our ensemble performance metrics for the training and test periods are shown in <xref ref-type="table" rid="T5">
<bold>Table&#xa0;5</bold>
</xref> and <xref ref-type="table" rid="T6">
<bold>Table&#xa0;6</bold>
</xref>, respectively. What becomes evident is that integrating <italic>NGRs</italic> into our ensemble model substantially augments its predictive capabilities. This improvement is noticeable during the test period. Notably, the PSS and F-1 score saw a 10% increase when <italic>NGRs</italic> were included in the ensemble model, demonstrating a more skillful forecast (<xref ref-type="table" rid="T6">
<bold>Table&#xa0;6</bold>
</xref>).</p>
<p>To contextualize our ensemble&#x2019;s performance, it is useful to compare it with other contemporary ML-based RI forecasting models. <xref ref-type="bibr" rid="B57">Wei et&#xa0;al. (2023)</xref> presented a deep learning network model called TCNET, which they compared against two Statistical Hurricane Intensity Prediction Schemes (SHIPS)-based models (COR-SHIPS and LLE-SHIPS), along with other models from <xref ref-type="bibr" rid="B60">Yang (2016)</xref> (henceforth referred to as Y16) and <xref ref-type="bibr" rid="B22">Kaplan et&#xa0;al. (2015)</xref> (henceforth referred to as KRD15). <xref ref-type="bibr" rid="B30">Ko et&#xa0;al. (2023)</xref> explored the application of a consensus machine learning (CML) model in TC intensity change forecasting and indicated that the CML exhibits better performance on RI predictions compared to operational models such as SHIPS and GFS. <xref ref-type="bibr" rid="B44">Narayanan et&#xa0;al. (2023)</xref> proposed a simple deterministic binary classification model based on the co-occurrence of environmental parameters (MCE) to predict an RI event. Their results indicated that MCE shows improved skill over the decision tree and logistic regression models, with more accurate RI predictions in the overall testing dataset. The PSS values for these models, displayed in <xref ref-type="fig" rid="f6">
<bold>Figure&#xa0;6</bold>
</xref>, show that our ensemble model (<italic>NGR</italic>-ENS), with a PSS of 0.56 and a POD of 0.79, surpasses all these competing models including TCNET (0.48), MCE (0.40) and CML (0.50). TCNET has the lowest FAR (0.43) followed by CML (0.50), LLE-SHIPS (0.56) and <italic>NGR</italic>-ENS (0.62). This holds even when considering different target periods or datasets. In essence, our ensemble approach fortified by the inclusion of <italic>NGRs</italic> offers superior predictive accuracy for RI events with an advantage of the noticeably high POD rate and the relatively low FAR rate.</p>
<fig id="f6" position="float">
<label>Figure&#xa0;6</label>
<caption>
<p>Performance metric values for the COR-SHIPS (blue), LLE-SHIPS (green), TCNET (purple), Y16 (yellow), KRD15 (brown), MCE (pink), and CML (gray) models, compared with the NGR-ENS (red) model developed in this study.</p>
</caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmars-10-1296274-g006.tif"/>
</fig>
<p>
<xref ref-type="bibr" rid="B34">Lee et&#xa0;al. (2016)</xref> suggested that the bimodal distribution of lifetime maximum intensity in TCs can be attributed to two distinct types of TC: those that experience RI (RI storms) and those that do not (non-RI storms). They showed that a significant majority&#x2014;79%&#x2014;of major TCs, those classified as category 3 or above, are RI storms. Conversely, only a small fraction&#x2014;6%&#x2014;of non-RI storms ever escalate to become major TCs. Therefore, RI prediction performance in major TCs can represent the overall prediction performance. During the test period (2019&#x2013;2021), our ensemble model showed noticeable performance improvements when <italic>NGR</italic> was included as a variable (<xref ref-type="table" rid="T7">
<bold>Table&#xa0;7</bold>
</xref>). A recent <italic>C<sub>d</sub>
</italic> parameterization study showed that <italic>C<sub>d</sub>
</italic> decreases after saturating at 33&#xa0;m s<sup>-1</sup>, which leads to an increase in <italic>NGR</italic>, which can induce RI (<xref ref-type="bibr" rid="B24">Kim et&#xa0;al., 2022</xref>). These findings suggest that accurately simulating flux exchanges, especially in storms ranging from categories 1&#x2013;3, can substantially enhance the model&#x2019;s ability to predict RI accurately.</p>
<table-wrap id="T7" position="float">
<label>Table&#xa0;7</label>
<caption>
<p>Performance metrics for the ensemble of five prediction models for major TCs during the test period (2019&#x2013;2021).</p>
</caption>
<table frame="hsides">
<thead>
<tr>
<th valign="middle" align="center">Ensemble</th>
<th valign="middle" align="center">POD</th>
<th valign="middle" align="center">FAR</th>
<th valign="top" align="center">Precision</th>
<th valign="middle" align="center">PSS</th>
<th valign="top" align="center">F-1 score</th>
<th valign="middle" align="center">ACC</th>
</tr>
</thead>
<tbody>
<tr>
<td valign="middle" align="center">w/o <italic>NGRs</italic>
</td>
<td valign="middle" align="center">0.86</td>
<td valign="middle" align="center">0.48</td>
<td valign="top" align="center">0.52</td>
<td valign="middle" align="center">0.61</td>
<td valign="top" align="center">0.65</td>
<td valign="middle" align="center">77.7%</td>
</tr>
<tr>
<td valign="middle" align="center">With <italic>NGRs</italic>
</td>
<td valign="middle" align="center">0.91</td>
<td valign="middle" align="center">0.45</td>
<td valign="top" align="center">0.55</td>
<td valign="middle" align="center">0.68</td>
<td valign="top" align="center">0.69</td>
<td valign="middle" align="center">80.2%</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
</sec>
<sec id="s4">
<label>4</label>
<title>Conclusions and discussions</title>
<p>In this study, binary RI prediction models for the WNP were developed by incorporating the <italic>NGR</italic>, which was derived using the upper ocean thermal structure of the pre-storm ocean and a realistic parameterization of sea surface roughness, into ML models. Five ML experiments were conducted to produce RI classification predictions, using five ML techniques&#x2014;DT, LR, SVM, KNN, and FNN&#x2014;trained with widely used predictors. To investigate the impact of <italic>NGR</italic> on RI prediction, two sets of experiments were conducted for each ML model. In the first set, models were trained only with well-known existing predictors, while in the second set, <italic>NGR</italic> was also included. For the training period, the results with the newly used predictors, <italic>NGR</italic>s, show improved skill over the traditional predictors for all the ML models except DT. For the test period, all the ML models trained with <italic>NGR</italic>s again perform better, with higher POD, PSS, and ACC and lower FAR than the same models trained without <italic>NGR</italic>s. An ensemble of the five individual ML models is constructed based on the hard-voting method. We show that the ensemble ML model produces noteworthy improvements for RI in the WNP. The inclusion of <italic>NGR</italic>s in the predictor pool of the ensemble model enhances RI prediction performance (PSS) by approximately 10% compared to the ensemble model without <italic>NGR</italic>s. These results suggest that the inclusion of <italic>NGR</italic> contributes to more accurate statistical-dynamical predictions of RI, corroborating previous findings that the <italic>NGR</italic> index better estimates changes in TC intensity in the WNP (LEE19).</p>
<p>In our study, we employed PCA to tackle the challenges associated with a high-dimensional dataset, particularly the risk of overfitting. Overfitting could jeopardize both the model&#x2019;s reliability and its ability to generalize to new data. PCA ameliorated this by compressing the data dimensions while retaining the most important variance, thereby enhancing the model&#x2019;s reliability. In this study, we checked the performance of the prediction model with and without PCA to confirm the improvement in prediction performance through PCA. During the training period, the application of PCA did not significantly impact the predictive performance of the model. However, during the test period, the model that applied PCA showed approximately 10% higher prediction performance than the model that did not apply it (based on NGR-ENS). Using PCA to reduce model overfitting effectively reduces dimensions while retaining key information and eliminating unnecessary noise. This approach prevents the model from being overly optimized for training data, enhancing its generalization ability. PCA lowers the risk of overfitting seen in high-dimensional data when considering all features, which can lead to better performance on both training and testing data. Thus, PCA plays a crucial role in decreasing model complexity and improving predictive capabilities by capturing essential patterns and structures. However, it is worth noting that PCA comes with limitations, such as reduced interpretability due to the transformation of original variables into principal components. This makes it difficult to make intuitive sense of the model&#x2019;s features. Additionally, PCA may overlook non-linear relationships between variables, potentially missing out on important data patterns. Despite these drawbacks, the computational efficiency and reduced risk of overfitting achieved through PCA were indispensable for improving our model&#x2019;s overall reliability and stability.</p>
<p>This study focused on the WNP. To ascertain the broader applicability of these models, they should be trialed in different basins. It is pivotal to understand if the <italic>NGR</italic>-based approach&#x2019;s efficacy remains consistent irrespective of region. The current study employs a depth-based DAT at 10-m intervals in <italic>NGR</italic> calculations. A more adaptive approach might involve modulating the depth contingent on real-time TC characteristics like its intensity, speed, latitude, and size. Such dynamism can potentially enhance the precision of the <italic>NGR</italic>, leading to improved predictions. Apart from <italic>NGR</italic>, there might be other indices or predictors that can be tested alongside or against the <italic>NGR</italic> to see which provides the most accurate results. This could lead to a more robust model or a combination of indices for improved RI prediction. The choice of the hard-voting ensemble method was predominantly due to SVM&#x2019;s characteristics. Yet, diversifying into other ensemble strategies, including weighted voting or stacking, may offer a finer prediction approach.</p>
<p>Understanding time series data often unveils serial dependence, where each data point is potentially influenced by its predecessors. This temporal dependency implies that past observations significantly impact present and future values (<xref ref-type="bibr" rid="B4">Box and Pierce, 1970</xref>; <xref ref-type="bibr" rid="B39">Ljung and Box, 1978</xref>). Similarly, in spatial data, we observe a spatial dependency, where the characteristics of a specific location may be influenced by its neighboring areas. Traditional ML models typically struggle with these dependencies. They often assume that data points are independent and identically distributed, an assumption that falls short in the context of time series and spatial data. To better handle these types of data, it&#x2019;s crucial to integrate information about past values in the case of time series (lagged values) and details about neighboring locations in spatial data into the models. This enrichment of the feature set allows the models to acknowledge and utilize these dependencies, enhancing their effectiveness. While advanced deep learning methods, like CNNs and Recurrent Neural Networks (RNNs), provide comprehensive solutions for handling these complexities, simpler adaptations to existing methodologies can also be effective and offer more interpretability. The future of research in this area lies in exploring these strategies to improve the capabilities of models, making them more accurate and reliable in mirroring the dynamics of time series and spatial data. This improvement is particularly relevant for robust and accurate prediction in real-world applications, such as RI prediction. By focusing on these aspects, significant advancements in the robustness and accuracy of RI prediction models are anticipated, enhancing their applicability in practical scenarios.</p>
</sec>
<sec id="s5" sec-type="data-availability">
<title>Data availability statement</title>
<p>TC data can be found on the IBTrACS website (<uri xlink:href="https://www.ncei.noaa.gov/data/international-best-track-archive-for-climate-stewardship-ibtracs/v04r00/access/netcdf/">https://www.ncei.noaa.gov/data/international-best-track-archive-for-climate-stewardship-ibtracs/v04r00/access/netcdf/</uri>), GFS 6-hourly data at <uri xlink:href="https://www.ncei.noaa.gov/data/global-forecast-system/access/">https://www.ncei.noaa.gov/data/global-forecast-system/access/</uri>, and HYCOM+NCODA data at <uri xlink:href="https://www.hycom.org/dataserver/gofs-3pt1/analysis">https://www.hycom.org/dataserver/gofs-3pt1/analysis</uri>.</p>
</sec>
<sec id="s6" sec-type="author-contributions">
<title>Author contributions</title>
<p>S-HK: Conceptualization, Data curation, Formal analysis, Methodology, Writing &#x2013; original draft, Writing &#x2013; review &amp; editing. WL: Conceptualization, Formal analysis, Methodology, Validation, Writing &#x2013; review &amp; editing. H-WK: Formal analysis, Supervision, Validation, Writing &#x2013; review &amp; editing. SK: Supervision, Validation, Writing &#x2013; review &amp; editing.</p>
</sec>
</body>
<back>
<sec id="s7" sec-type="funding-information">
<title>Funding</title>
<p>The author(s) declare financial support was received for the research, authorship, and/or publication of this article. This research was a part of the project titled &#x201c;Study on Northwestern Pacific warming and genesis and rapid intensification of typhoon&#x201d;, funded by the Ministry of Oceans and Fisheries, Korea (20220566). This work was also funded by the Korea Meteorological Administration Research and Development Program &#x201c;Development of Asian Dust and Haze Monitoring and Prediction Technology&#x201d; under Grant (KMA2018-00521).</p>
</sec>
<sec id="s8" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s9" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors&#xa0;and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s10" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online&#xa0;at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fmars.2023.1296274/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fmars.2023.1296274/full#supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="Table_1.docx" id="ST1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Balaguru</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Foltz</surname> <given-names>G. R.</given-names>
</name>
<name>
<surname>Leung</surname> <given-names>L. R.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Increasing magnitude of hurricane rapid intensification in the central and eastern tropical Atlantic</article-title>. <source>Geophys. Res. Lett.</source> <volume>45</volume> (<issue>9</issue>), <fpage>4238</fpage>&#x2013;<lpage>4247</lpage>. doi: <pub-id pub-id-type="doi">10.1029/2018GL077597</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bender</surname> <given-names>M. A.</given-names>
</name>
<name>
<surname>Ginis</surname> <given-names>I.</given-names>
</name>
<name>
<surname>Tuleya</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Thomas</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Marchok</surname> <given-names>T.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>The operational GFDL coupled hurricane&#x2013;ocean prediction system and a summary of its performance</article-title>. <source>Monthly Weather Rev.</source> <volume>135</volume> (<issue>12</issue>), <fpage>3965</fpage>&#x2013;<lpage>3989</lpage>. doi: <pub-id pub-id-type="doi">10.1175/2007MWR2032.1</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Biswas</surname> <given-names>M. K.</given-names>
</name>
<name>
<surname>Abarca</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Bernardet</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Ginis</surname> <given-names>I.</given-names>
</name>
<name>
<surname>Grell</surname> <given-names>E.</given-names>
</name>
<name>
<surname>Iacono</surname> <given-names>M.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <source>Hurricane weather research and forecasting (HWRF) Model: 2017 scientific Documentation (Technical Report)</source> (<publisher-loc>Boulder, CO</publisher-loc>: <publisher-name>National Center for Atmospheric Research and Developmental Testbed Center</publisher-name>).</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Box</surname> <given-names>G. E. P.</given-names>
</name>
<name>
<surname>Pierce</surname> <given-names>D. A.</given-names>
</name>
</person-group> (<year>1970</year>). <article-title>Distribution of residual autocorrelations in autoregressive-integrated moving average time series models</article-title>. <source>J. Am. Statist. Assoc.</source> <volume>65</volume>, <fpage>1509</fpage>&#x2013;<lpage>1526</lpage>. doi: <pub-id pub-id-type="doi">10.1080/01621459.1970.10481180</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chawla</surname> <given-names>N. V.</given-names>
</name>
<name>
<surname>Bowyer</surname> <given-names>K. W.</given-names>
</name>
<name>
<surname>Hall</surname> <given-names>L. O.</given-names>
</name>
<name>
<surname>Kegelmeyer</surname> <given-names>W. P.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>SMOTE: Synthetic minority over-sampling technique</article-title>. <source>J. Artif. Intell. Res.</source> <volume>16</volume>, <fpage>321</fpage>&#x2013;<lpage>357</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1613/jair.953</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chen</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Bryan</surname> <given-names>G. H.</given-names>
</name>
<name>
<surname>Hazelton</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Marks</surname> <given-names>F. D.</given-names>
</name>
<name>
<surname>Fitzpatrick</surname> <given-names>P.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Evaluation and improvement of a TKE-based eddy-diffusivity mass-flux (EDMF) planetary boundary layer scheme in hurricane conditions</article-title>. <source>Weather Forecast</source>. <volume>37</volume> (<issue>6</issue>), <fpage>935</fpage>&#x2013;<lpage>951</lpage>. doi: <pub-id pub-id-type="doi">10.1175/WAF-D-21-0168.1</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cloud</surname> <given-names>K. A.</given-names>
</name>
<name>
<surname>Reich</surname> <given-names>B. J.</given-names>
</name>
<name>
<surname>Rozoff</surname> <given-names>C. M.</given-names>
</name>
<name>
<surname>Alessandrini</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Lewis</surname> <given-names>W. E.</given-names>
</name>
<name>
<surname>Delle Monache</surname> <given-names>L.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>A feed forward neural network based on model output statistics for short-term hurricane intensity prediction</article-title>. <source>Weather Forecasting</source> <volume>34</volume> (<issue>4</issue>), <fpage>985</fpage>&#x2013;<lpage>997</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1175/WAF-D-18-0173.1</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cortes</surname> <given-names>C.</given-names>
</name>
<name>
<surname>Vapnik</surname> <given-names>V.</given-names>
</name>
</person-group> (<year>1995</year>). <article-title>Support-vector networks</article-title>. <source>Mach. Learn.</source> <volume>20</volume> (<issue>3</issue>), <fpage>273</fpage>&#x2013;<lpage>297</lpage>. doi: <pub-id pub-id-type="doi">10.1007/BF00994018</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>DeMaria</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Franklin</surname> <given-names>J. L.</given-names>
</name>
<name>
<surname>Onderlinde</surname> <given-names>M. J.</given-names>
</name>
<name>
<surname>Kaplan</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Operational forecasting of tropical cyclone rapid intensification at the National Hurricane Center</article-title>. <source>Atmosphere</source> <volume>12</volume> (<issue>6</issue>), <fpage>683</fpage>. doi: <pub-id pub-id-type="doi">10.3390/atmos12060683</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>DeMaria</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Kaplan</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>1994</year>). <article-title>Sea surface temperature and the maximum intensity of Atlantic tropical cyclones</article-title>. <source>J. Climate</source> <volume>7</volume> (<issue>9</issue>), <fpage>1324</fpage>&#x2013;<lpage>1334</lpage>. doi: <pub-id pub-id-type="doi">10.1175/1520-0442(1994)007&lt;1324:SSTATM&gt;2.0.CO;2</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>DeMaria</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Kaplan</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>1999</year>). <article-title>An updated statistical hurricane intensity prediction scheme (SHIPS) for the Atlantic and eastern North Pacific basins</article-title>. <source>Weather Forecasting</source> <volume>14</volume> (<issue>3</issue>), <fpage>326</fpage>&#x2013;<lpage>337</lpage>. doi: <pub-id pub-id-type="doi">10.1175/1520-0434(1999)014&lt;0326:AUSHIP&gt;2.0.CO;2</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>DeMaria</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Mainelli</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Shay</surname> <given-names>L. K.</given-names>
</name>
<name>
<surname>Knaff</surname> <given-names>J. A.</given-names>
</name>
<name>
<surname>Kaplan</surname> <given-names>J.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Further improvements to the statistical hurricane intensity prediction scheme (SHIPS)</article-title>. <source>Weather Forecast.</source> <volume>20</volume> (<issue>4</issue>), <fpage>531</fpage>&#x2013;<lpage>543</lpage>. doi: <pub-id pub-id-type="doi">10.1175/WAF862.1</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Emanuel</surname> <given-names>K. A.</given-names>
</name>
</person-group> (<year>1986</year>). <article-title>An air-sea interaction theory for tropical cyclones. Part I: Steady-state maintenance</article-title>. <source>J. Atmospheric Sci.</source> <volume>43</volume> (<issue>6</issue>), <fpage>585</fpage>&#x2013;<lpage>605</lpage>. doi: <pub-id pub-id-type="doi">10.1175/1520-0469(1986)043&lt;0585:AASITF&gt;2.0.CO;2</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Emanuel</surname> <given-names>K. A.</given-names>
</name>
</person-group> (<year>1988</year>). <article-title>The maximum intensity of hurricanes</article-title>. <source>J. Atmos. Sci.</source> <volume>45</volume> (<issue>7</issue>), <fpage>1143</fpage>&#x2013;<lpage>1155</lpage>. doi: <pub-id pub-id-type="doi">10.1175/1520-0469(1988)045&lt;1143:TMIOH&gt;2.0.CO;2</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Emanuel</surname> <given-names>K. A.</given-names>
</name>
</person-group> (<year>1995</year>). <article-title>Sensitivity of tropical cyclones to surface exchange coefficients and a revised steady-state model incorporating eye dynamics</article-title>. <source>J. Atmospheric Sci.</source> <volume>52</volume> (<issue>22</issue>), <fpage>3969</fpage>&#x2013;<lpage>3976</lpage>. doi: <pub-id pub-id-type="doi">10.1175/1520-0469(1995)052&lt;3969:SOTCTS&gt;2.0.CO;2</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Feng</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>X.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Impact of increasing horizontal and vertical resolution during the HWRF hybrid EnVar data assimilation on the analysis and prediction of Hurricane Patricia (2015)</article-title>. <source>Monthly Weather Rev.</source> <volume>149</volume>, <fpage>419</fpage>&#x2013;<lpage>441</lpage>. doi: <pub-id pub-id-type="doi">10.1175/MWR-D-20-0144.1</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gao</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Lin</surname> <given-names>I. I.</given-names>
</name>
<name>
<surname>Chiu</surname> <given-names>L. S.</given-names>
</name>
<name>
<surname>Cao</surname> <given-names>K.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Improvements in typhoon intensity change classification by incorporating an ocean coupling potential intensity index into decision trees</article-title>. <source>Weather Forecasting</source> <volume>31</volume> (<issue>1</issue>), <fpage>95</fpage>&#x2013;<lpage>106</lpage>. doi: <pub-id pub-id-type="doi">10.1175/WAF-D-15-0062.1</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Goldenberg</surname> <given-names>S. B.</given-names>
</name>
<name>
<surname>Gopalakrishnan</surname> <given-names>S. G.</given-names>
</name>
<name>
<surname>Tallapragada</surname> <given-names>V.</given-names>
</name>
<name>
<surname>Quirino</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Marks</surname> <given-names>F.</given-names>
<suffix>Jr.</suffix>
</name>
<name>
<surname>Trahan</surname> <given-names>S.</given-names>
</name>
<etal/>
</person-group>. (<year>2015</year>). <article-title>The 2012 triply nested, high-resolution operational version of the Hurricane Weather Research and Forecasting Model (HWRF): Track and intensity forecast verifications</article-title>. <source>Weather Forecasting</source> <volume>30</volume> (<issue>3</issue>), <fpage>710</fpage>&#x2013;<lpage>729</lpage>. doi: <pub-id pub-id-type="doi">10.1175/WAF-D-14-00098.1</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Griffin</surname> <given-names>S. M.</given-names>
</name>
<name>
<surname>Wimmers</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Velden</surname> <given-names>C. S.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Predicting rapid intensification in North Atlantic and eastern North Pacific tropical cyclones using a convolutional neural network</article-title>. <source>Weather Forecasting</source> <volume>37</volume> (<issue>8</issue>), <fpage>1333</fpage>&#x2013;<lpage>1355</lpage>. doi: <pub-id pub-id-type="doi">10.1175/WAF-D-21-0194.1</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kaplan</surname> <given-names>J.</given-names>
</name>
<name>
<surname>DeMaria</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2003</year>). <article-title>Large-scale characteristics of rapidly intensifying tropical cyclones in the North Atlantic basin</article-title>. <source>Weather Forecasting</source> <volume>18</volume> (<issue>6</issue>), <fpage>1093</fpage>&#x2013;<lpage>1108</lpage>. doi: <pub-id pub-id-type="doi">10.1175/1520-0434(2003)018&lt;1093:LCORIT&gt;2.0.CO;2</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kaplan</surname> <given-names>J.</given-names>
</name>
<name>
<surname>DeMaria</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Knaff</surname> <given-names>J. A.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>A revised tropical cyclone rapid intensification index for the Atlantic and Eastern North Pacific Basins</article-title>. <source>Weather Forecast.</source> <volume>25</volume> (<issue>1</issue>), <fpage>220</fpage>&#x2013;<lpage>241</lpage>. doi: <pub-id pub-id-type="doi">10.1175/2009WAF2222280.1</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kaplan</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Rozoff</surname> <given-names>C. M.</given-names>
</name>
<name>
<surname>DeMaria</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Sampson</surname> <given-names>C. R.</given-names>
</name>
<name>
<surname>Kossin</surname> <given-names>J. P.</given-names>
</name>
<name>
<surname>Velden</surname> <given-names>C. S.</given-names>
</name>
<etal/>
</person-group>. (<year>2015</year>). <article-title>Evaluating environmental impacts on tropical cyclone rapid intensification predictability utilizing statistical models</article-title>. <source>Weather Forecasting</source> <volume>30</volume> (<issue>5</issue>), <fpage>1374</fpage>&#x2013;<lpage>1396</lpage>. doi: <pub-id pub-id-type="doi">10.1175/WAF-D-15-0032.1</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Keller</surname> <given-names>J. M.</given-names>
</name>
<name>
<surname>Gray</surname> <given-names>M. R.</given-names>
</name>
<name>
<surname>Givens</surname> <given-names>J. A.</given-names>
</name>
</person-group> (<year>1985</year>). <article-title>A fuzzy k-nearest neighbor algorithm</article-title>. <source>IEEE Trans. Syst. Man Cybern.</source> <volume>SMC-15</volume> (<issue>4</issue>), <fpage>580</fpage>&#x2013;<lpage>585</lpage>. doi: <pub-id pub-id-type="doi">10.1109/TSMC.1985.6313426</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname> <given-names>H. J.</given-names>
</name>
<name>
<surname>Moon</surname> <given-names>I. J.</given-names>
</name>
<name>
<surname>Oh</surname> <given-names>I.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Comparison of tropical cyclone wind radius&#xa0;estimates between the KMA, RSMC Tokyo, and JTWC</article-title>. <source>Asia-Pac J. Atmos Sci.</source> <volume>58</volume>, <fpage>563</fpage>&#x2013;<lpage>576</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s13143-022-00274-5</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname> <given-names>S. H.</given-names>
</name>
<name>
<surname>Kang</surname> <given-names>H. W.</given-names>
</name>
<name>
<surname>Moon</surname> <given-names>I. J.</given-names>
</name>
<name>
<surname>Kang</surname> <given-names>S. K.</given-names>
</name>
<name>
<surname>Chu</surname> <given-names>P. S.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Effects of the reduced air-sea drag coefficient in high winds on the rapid intensification of tropical cyclones and bimodality of the lifetime maximum intensity</article-title>. <source>Front. Mar. Sci.</source> <volume>9</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fmars.2022.1032888</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname> <given-names>S. H.</given-names>
</name>
<name>
<surname>Moon</surname> <given-names>I. J.</given-names>
</name>
<name>
<surname>Chu</surname> <given-names>P. S.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Statistical&#x2013;dynamical typhoon intensity predictions in the Western North Pacific using track pattern clustering and ocean coupling predictors</article-title>. <source>Weather Forecasting</source> <volume>33</volume> (<issue>1</issue>), <fpage>347</fpage>&#x2013;<lpage>365</lpage>. doi: <pub-id pub-id-type="doi">10.1175/WAF-D-17-0082.1</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Klotzbach</surname> <given-names>P. J.</given-names>
</name>
<name>
<surname>Wood</surname> <given-names>K. M.</given-names>
</name>
<name>
<surname>Schreck</surname> <given-names>C. J.</given-names>
<suffix>III</suffix>
</name>
<name>
<surname>Bowen</surname> <given-names>S. G.</given-names>
</name>
<name>
<surname>Patricola</surname> <given-names>C. M.</given-names>
</name>
<name>
<surname>Bell</surname> <given-names>M. M.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Trends in global tropical cyclone activity: 1990&#x2013;2021</article-title>. <source>Geophys. Res. Lett.</source> <volume>49</volume> (<issue>6</issue>), <elocation-id>e2021GL095774</elocation-id>. doi: <pub-id pub-id-type="doi">10.1029/2021GL095774</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Knaff</surname> <given-names>J. A.</given-names>
</name>
<name>
<surname>Sampson</surname> <given-names>C. R.</given-names>
</name>
<name>
<surname>DeMaria</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>An operational statistical typhoon intensity prediction scheme for the western North Pacific</article-title>. <source>Weather Forecasting</source> <volume>20</volume> (<issue>4</issue>), <fpage>688</fpage>&#x2013;<lpage>699</lpage>. doi: <pub-id pub-id-type="doi">10.1175/WAF863.1</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Knutson</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Camargo</surname> <given-names>S. J.</given-names>
</name>
<name>
<surname>Chan</surname> <given-names>J. C.</given-names>
</name>
<name>
<surname>Emanuel</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Ho</surname> <given-names>C. H.</given-names>
</name>
<name>
<surname>Kossin</surname> <given-names>J.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>Tropical cyclones and climate change assessment: Part II: Projected response to anthropogenic warming</article-title>. <source>Bull. Am. Meteorol. Soc.</source> <volume>101</volume> (<issue>3</issue>), <fpage>E303</fpage>&#x2013;<lpage>E322</lpage>. doi: <pub-id pub-id-type="doi">10.1175/BAMS-D-18-0194.1</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ko</surname> <given-names>M. C.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Kubat</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Gopalakrishnan</surname> <given-names>S.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>The development of a consensus machine learning model for hurricane rapid intensification forecasts with hurricane weather research and forecasting (HWRF) data</article-title>. <source>Weather Forecasting</source> <volume>38</volume>, <fpage>1253</fpage>&#x2013;<lpage>1270</lpage>. doi: <pub-id pub-id-type="doi">10.1175/WAF-D-22-0217.1</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kossin</surname> <given-names>J. P.</given-names>
</name>
<name>
<surname>Knapp</surname> <given-names>K. R.</given-names>
</name>
<name>
<surname>Olander</surname> <given-names>T. L.</given-names>
</name>
<name>
<surname>Velden</surname> <given-names>C. S.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Global increase in major tropical cyclone exceedance probability over the past four decades</article-title>. <source>Proc. Natl. Acad. Sci.</source> <volume>117</volume> (<issue>22</issue>), <fpage>11975</fpage>&#x2013;<lpage>11980</lpage>. doi: <pub-id pub-id-type="doi">10.1073/pnas.1920849117</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lee</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>S. H.</given-names>
</name>
<name>
<surname>Chu</surname> <given-names>P. S.</given-names>
</name>
<name>
<surname>Moon</surname> <given-names>I. J.</given-names>
</name>
<name>
<surname>Soloviev</surname> <given-names>A. V.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>An index to better estimate tropical cyclone intensity change in the western North Pacific</article-title>. <source>Geophys. Res. Lett.</source> <volume>46</volume> (<issue>15</issue>), <fpage>8960</fpage>&#x2013;<lpage>8968</lpage>. doi: <pub-id pub-id-type="doi">10.1029/2019GL083273</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lee</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Kim</surname> <given-names>S. H.</given-names>
</name>
<name>
<surname>Moon</surname> <given-names>I.-J.</given-names>
</name>
<name>
<surname>Bell</surname> <given-names>M. M.</given-names>
</name>
<name>
<surname>Ginis</surname> <given-names>I.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>New parameterization of air-sea exchange coefficients and its impact on intensity prediction under major tropical cyclones</article-title>. <source>Front. Mar. Sci.</source> <volume>9</volume>. doi:&#xa0;<pub-id pub-id-type="doi">10.3389/fmars.2022.1046511</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lee</surname> <given-names>C. Y.</given-names>
</name>
<name>
<surname>Tippett</surname> <given-names>M. K.</given-names>
</name>
<name>
<surname>Sobel</surname> <given-names>A. H.</given-names>
</name>
<name>
<surname>Camargo</surname> <given-names>S. J.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Rapid intensification and the bimodal distribution of tropical cyclone intensity</article-title>. <source>Nat.&#xa0;Commun.</source> <volume>7</volume>, <fpage>10625</fpage>. doi: <pub-id pub-id-type="doi">10.1038/ncomms10625</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Wan</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Huang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>X.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>An initialization scheme for&#xa0;weak tropical cyclones in the South China Sea</article-title>. <source>J. Meteorol. Res.</source> <volume>35</volume>, <fpage>358</fpage>&#x2013;<lpage>370</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s13351-021-0069-3</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Peng</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Lan</surname> <given-names>H.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <article-title>Statistical regression scheme for intensity prediction of tropical cyclones in the Northwestern Pacific</article-title>. <source>Weather Forecasting</source> <volume>33</volume>, <fpage>1299</fpage>&#x2013;<lpage>1315</lpage>. doi: <pub-id pub-id-type="doi">10.1175/WAF-D-18-0001.1</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lin</surname> <given-names>I. I.</given-names>
</name>
<name>
<surname>Black</surname> <given-names>P.</given-names>
</name>
<name>
<surname>Price</surname> <given-names>J. F.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>C. Y.</given-names>
</name>
<name>
<surname>Chen</surname> <given-names>S. S.</given-names>
</name>
<name>
<surname>Lien</surname> <given-names>C. C.</given-names>
</name>
<etal/>
</person-group>. (<year>2013</year>). <article-title>An ocean coupling potential intensity index for tropical cyclones</article-title>. <source>Geophys. Res. Lett.</source> <volume>40</volume> (<issue>9</issue>), <fpage>1878</fpage>&#x2013;<lpage>1882</lpage>. doi: <pub-id pub-id-type="doi">10.1002/grl.50091</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname> <given-names>Q.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Tong</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>W.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>Vortex initialization in the NCEP operational hurricane models</article-title>. <source>Atmosphere</source> <volume>11</volume>, <fpage>968</fpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.3390/atmos11090968</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ljung</surname> <given-names>G.</given-names>
</name>
<name>
<surname>Box</surname> <given-names>G. E. P.</given-names>
</name>
</person-group> (<year>1978</year>). <article-title>On a measure of lack of fit in time series models</article-title>. <source>Biometrika</source> <volume>65</volume> (<issue>2</issue>), <fpage>297</fpage>&#x2013;<lpage>303</lpage>. doi:&#xa0;<pub-id pub-id-type="doi">10.1093/biomet/65.2.297</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lu</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Davis</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>X.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Improving the assimilation of enhanced atmospheric motion vectors for hurricane intensity predictions with HWRF</article-title>. <source>Remote Sens.</source> <volume>14</volume>, <fpage>2040</fpage>. doi: <pub-id pub-id-type="doi">10.3390/rs14092040</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Magnusson</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Majumdar</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Emerton</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Richardson</surname> <given-names>D.</given-names>
</name>
<name>
<surname>Alonso-Balmaseda</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Baugh</surname> <given-names>C.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>ECMWF Technical Memorandum No. 888 (European Centre for Medium-Range Weather Forecasts)</article-title>. doi: <pub-id pub-id-type="doi">10.21957/zzxzzygwv</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mercer</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Grimes</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Atlantic tropical cyclone rapid intensification probabilistic forecasts from an ensemble of machine learning methods</article-title>. <source>Proc. Comput. Sci.</source> <volume>114</volume>, <fpage>333</fpage>&#x2013;<lpage>340</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.procs.2017.09.036</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Murakami</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Li</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Kitoh</surname> <given-names>A.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Projected increase in tropical cyclones near Hawaii</article-title>. <source>Nat. Climate Change</source> <volume>3</volume> (<issue>8</issue>), <fpage>749</fpage>&#x2013;<lpage>754</lpage>. doi: <pub-id pub-id-type="doi">10.1038/nclimate1890</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Narayanan</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Balaguru</surname> <given-names>K.</given-names>
</name>
<name>
<surname>Xu</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Leung</surname> <given-names>L. R.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>A new method for predicting hurricane rapid intensification based on co-occurring environmental parameters</article-title>. <source>Nat. Hazards</source>. doi:&#xa0;<pub-id pub-id-type="doi">10.1007/s11069-023-06100-z</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ooyama</surname> <given-names>K.</given-names>
</name>
</person-group> (<year>1969</year>). <article-title>Numerical simulation of the life cycle of tropical cyclones</article-title>. <source>J.&#xa0;Atmospheric Sci.</source> <volume>26</volume> (<issue>1</issue>), <fpage>3</fpage>&#x2013;<lpage>40</lpage>. doi: <pub-id pub-id-type="doi">10.1175/1520-0469(1969)026&lt;0003:NSOTLC&gt;2.0.CO;2</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Price</surname> <given-names>J. F.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Metrics of hurricane-ocean interaction: vertically-integrated or vertically-averaged ocean temperature?</article-title> <source>Ocean Sci.</source> <volume>5</volume> (<issue>3</issue>), <fpage>351</fpage>&#x2013;<lpage>368</lpage>. doi: <pub-id pub-id-type="doi">10.5194/os-5-351-2009</pub-id>
</citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Quinlan</surname> <given-names>J. R.</given-names>
</name>
</person-group> (<year>1987</year>). <article-title>Simplifying decision trees</article-title>. <source>Int. J. Man-Machine Stud.</source> <volume>27</volume> (<issue>3</issue>), <fpage>221</fpage>&#x2013;<lpage>234</lpage>. doi: <pub-id pub-id-type="doi">10.1016/S0020-7373(87)80053-6</pub-id>
</citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rozoff</surname> <given-names>C. M.</given-names>
</name>
<name>
<surname>Kossin</surname> <given-names>J. P.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>New probabilistic forecast models for the&#xa0;prediction of tropical cyclone rapid intensification</article-title>. <source>Weather Forecasting</source> <volume>26</volume> (<issue>5</issue>), <fpage>677</fpage>&#x2013;<lpage>689</lpage>. doi: <pub-id pub-id-type="doi">10.1175/WAF-D-10-05059.1</pub-id>
</citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shaiba</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Hahsler</surname> <given-names>M.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Applying machine learning methods for predicting tropical cyclone rapid intensification events</article-title>. <source>Res. J. Appl. Sciences Eng. Technol.</source> <volume>13</volume> (<issue>8</issue>), <fpage>638</fpage>&#x2013;<lpage>651</lpage>. doi: <pub-id pub-id-type="doi">10.19026/rjaset.13.3050</pub-id>
</citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Soloviev</surname> <given-names>A. V.</given-names>
</name>
<name>
<surname>Lukas</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Donelan</surname> <given-names>M. A.</given-names>
</name>
<name>
<surname>Haus</surname> <given-names>B. K.</given-names>
</name>
<name>
<surname>Ginis</surname> <given-names>I.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>The air-sea interface and surface stress under tropical cyclones</article-title>. <source>Sci. Rep.</source> <volume>4</volume>, <fpage>5306</fpage>. doi: <pub-id pub-id-type="doi">10.1038/srep05306</pub-id>
</citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Song</surname> <given-names>X.</given-names>
</name>
<name>
<surname>Zhu</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Peng</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Guan</surname> <given-names>H.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Improving multi-model ensemble forecasts of tropical cyclone intensity using Bayesian model averaging</article-title>. <source>J. Meteorol. Res.</source> <volume>32</volume> (<issue>5</issue>), <fpage>794</fpage>&#x2013;<lpage>803</lpage>. doi: <pub-id pub-id-type="doi">10.1007/s13351-018-7117-7</pub-id>
</citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Su</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>L.</given-names>
</name>
<name>
<surname>Jiang</surname> <given-names>J. H.</given-names>
</name>
<name>
<surname>Pai</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Zhai</surname> <given-names>A. J.</given-names>
</name>
<etal/>
</person-group>. (<year>2020</year>). <article-title>Applying satellite observations of tropical cyclone internal structures to rapid intensification forecast with machine learning</article-title>. <source>Geophys. Res. Lett.</source> <volume>47</volume> (<issue>17</issue>), <elocation-id>e2020GL089102</elocation-id>. doi: <pub-id pub-id-type="doi">10.1029/2020GL089102</pub-id>
</citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tefas</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Pitas</surname> <given-names>I.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Principal component analysis</article-title>. <source>Intelligent Syst.</source> <volume>487</volume>.</citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Walker</surname> <given-names>S. H.</given-names>
</name>
<name>
<surname>Duncan</surname> <given-names>D. B.</given-names>
</name>
</person-group> (<year>1967</year>). <article-title>Estimation of the probability of an event as a function of several independent variables</article-title>. <source>Biometrika</source> <volume>54</volume> (<issue>1</issue>), <page-range>167&#x2013;179</page-range>.</citation>
</ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>S.</given-names>
</name>
<name>
<surname>Toumi</surname> <given-names>R.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Recent tropical cyclone changes inferred from ocean surface temperature cold wakes</article-title>. <source>Sci. Rep.</source> <volume>11</volume>, <fpage>22269</fpage>. doi: <pub-id pub-id-type="doi">10.1038/s41598-021-01612-9</pub-id>
</citation>
</ref>
<ref id="B56">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Wang</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Liu</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Mehra</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Tallapragada</surname> <given-names>V.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Improving low-level wind simulations of tropical cyclones by a regional Hurricane Analysis and Forecast System</article-title>. <source>Res. Activities Earth Syst. Model</source>. <publisher-name>Working Group on Numerical Experimentation, WMO</publisher-name>, <publisher-loc>Geneva</publisher-loc>, pp. <page-range>9&#x2013;10</page-range>.</citation>
</ref>
<ref id="B57">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wei</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Yang</surname> <given-names>R.</given-names>
</name>
<name>
<surname>Sun</surname> <given-names>D.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Investigating tropical cyclone rapid intensification with an advanced artificial intelligence system and gridded reanalysis data</article-title>. <source>Atmosphere</source> <volume>14</volume> (<issue>2</issue>), <fpage>195</fpage>. doi: <pub-id pub-id-type="doi">10.3390/atmos14020195</pub-id>
</citation>
</ref>
<ref id="B58">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Balaguru</surname> <given-names>K.</given-names>
</name>
<name>
<surname>August</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Lalo</surname> <given-names>N.</given-names>
</name>
<name>
<surname>Hodas</surname> <given-names>N.</given-names>
</name>
<name>
<surname>DeMaria</surname> <given-names>M.</given-names>
</name>
<etal/>
</person-group>. (<year>2021</year>). <article-title>Deep learning experiments for tropical cyclone intensity forecasts</article-title>. <source>Weather Forecasting</source> <volume>36</volume> (<issue>4</issue>), <fpage>1453</fpage>&#x2013;<lpage>1470</lpage>. doi: <pub-id pub-id-type="doi">10.1175/WAF-D-20-0104.1</pub-id>
</citation>
</ref>
<ref id="B59">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yamaguchi</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Owada</surname> <given-names>H.</given-names>
</name>
<name>
<surname>Shimada</surname> <given-names>U.</given-names>
</name>
<name>
<surname>Sawada</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Iriguchi</surname> <given-names>T.</given-names>
</name>
<name>
<surname>Musgrave</surname> <given-names>K. D.</given-names>
</name>
<etal/>
</person-group>. (<year>2018</year>). <article-title>Tropical cyclone intensity prediction in the western North Pacific basin using SHIPS and JMA/GSM</article-title>. <source>SOLA</source> <volume>14</volume>, <fpage>138</fpage>&#x2013;<lpage>143</lpage>. doi: <pub-id pub-id-type="doi">10.2151/sola.2018-024</pub-id>
</citation>
</ref>
<ref id="B60">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname> <given-names>R.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>A systematic classification investigation of rapid intensification of Atlantic tropical cyclones with the SHIPS database</article-title>. <source>Weather Forecasting</source> <volume>31</volume> (<issue>2</issue>), <fpage>495</fpage>&#x2013;<lpage>513</lpage>. doi: <pub-id pub-id-type="doi">10.1175/WAF-D-15-0029.1</pub-id>
</citation>
</ref>
<ref id="B61">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>Y.</given-names>
</name>
<name>
<surname>Zhou</surname> <given-names>X.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Classification of power quality disturbances using visual attention mechanism and feed-forward neural network</article-title>. <source>Measurement</source> <volume>188</volume>, <fpage>110390</fpage>. doi: <pub-id pub-id-type="doi">10.1016/j.measurement.2021.110390</pub-id>
</citation>
</ref>
<ref id="B62">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Tong</surname> <given-names>M.</given-names>
</name>
<name>
<surname>Sippel</surname> <given-names>J. A.</given-names>
</name>
<name>
<surname>Mehra</surname> <given-names>A.</given-names>
</name>
<name>
<surname>Zhang</surname> <given-names>B.</given-names>
</name>
<name>
<surname>Wu</surname> <given-names>K.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>The impact of stochastic physics-based hybrid GSI/EnKF data assimilation on hurricane forecasts using EMC operation hurricane modeling system</article-title>. <source>Atmosphere</source> <volume>11</volume>, <fpage>801</fpage>. doi: <pub-id pub-id-type="doi">10.3390/atmos11080801</pub-id>
</citation>
</ref>
<ref id="B63">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname> <given-names>Z.</given-names>
</name>
<name>
<surname>Wang</surname> <given-names>W.</given-names>
</name>
<name>
<surname>Doyle</surname> <given-names>J. J.</given-names>
</name>
<name>
<surname>Maskaitis</surname> <given-names>J.</given-names>
</name>
<name>
<surname>Komaromi</surname> <given-names>W. A.</given-names>
</name>
<name>
<surname>Heming</surname> <given-names>J.</given-names>
</name>
<etal/>
</person-group>. (<year>2023</year>). <article-title>A review of recent advances (2018&#x2013;2021) on tropical cyclone intensity change from operational perspectives, Part 1: Dynamical model guidance</article-title>. <source>Trop. Cyclone Res. Rev.</source> <volume>12</volume> (<issue>1</issue>), <fpage>30</fpage>&#x2013;<lpage>49</lpage>. doi: <pub-id pub-id-type="doi">10.1016/j.tcrr.2023.05.004</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>