<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Big Data</journal-id>
<journal-title>Frontiers in Big Data</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Big Data</abbrev-journal-title>
<issn pub-type="epub">2624-909X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">642182</article-id>
<article-id pub-id-type="doi">10.3389/fdata.2021.642182</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Big Data</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Benchmarking of Data-Driven Causality Discovery Approaches in the Interactions of Arctic Sea Ice and Atmosphere</article-title>
<alt-title alt-title-type="left-running-head">Huang et&#x20;al.</alt-title>
<alt-title alt-title-type="right-running-head">Arctic Sea Ice Causality Discovery</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Huang</surname>
<given-names>Yiyi</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1074989/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Kleindessner</surname>
<given-names>Matth&#xe4;us</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="fn" rid="fn1">
<sup>&#x2020;</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Munishkin</surname>
<given-names>Alexey</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Varshney</surname>
<given-names>Debvrat</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Guo</surname>
<given-names>Pei</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/715678/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Wang</surname>
<given-names>Jianwu</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/541022/overview"/>
</contrib>
</contrib-group>
<aff id="aff1">
<label>
<sup>1</sup>
</label>Department of Hydrology and Atmospheric Sciences, University of Arizona, <addr-line>Tucson</addr-line>, <addr-line>AZ</addr-line>, <country>United&#x20;States</country>
</aff>
<aff id="aff2">
<label>
<sup>2</sup>
</label>Paul G. Allen School of Computer Science and Engineering, University of Washington, <addr-line>Seattle</addr-line>, <addr-line>WA</addr-line>, <country>United&#x20;States</country>
</aff>
<aff id="aff3">
<label>
<sup>3</sup>
</label>Department of Computer Science and Engineering, University of California Santa Cruz, <addr-line>Santa Cruz</addr-line>, <addr-line>CA</addr-line>, <country>United&#x20;States</country>
</aff>
<aff id="aff4">
<label>
<sup>4</sup>
</label>Department of Information Systems, University of Maryland, <addr-line>Baltimore</addr-line>, <addr-line>MD</addr-line>, <country>United&#x20;States</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/906026/overview">Justin Sheffield</ext-link>, University of Southampton, United&#x20;Kingdom</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/577016/overview">Zachary Langford</ext-link>, Oak Ridge National Laboratory (DOE), United&#x20;States</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1213357/overview">James Overland</ext-link>, National Oceanic and Atmospheric Administration (NOAA), United&#x20;States</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/709623/overview">Michel Tsamados</ext-link>, University College London, United&#x20;Kingdom</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Jianwu Wang, <email>jianwu@umbc.edu</email>
</corresp>
<fn fn-type="present-address" id="fn1">
<label>
<sup>
<bold>&#x2020;</bold>
</sup>
</label>
<p>
<bold>Present address:</bold> Matth&#xe4;us Kleindessner, Amazon, T&#xfc;bingen, Germany</p>
</fn>
<fn fn-type="other">
<p>This article was submitted to Data-driven Climate Sciences, a section of the journal Frontiers in Big&#x20;Data</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>24</day>
<month>08</month>
<year>2021</year>
</pub-date>
<pub-date pub-type="collection">
<year>2021</year>
</pub-date>
<volume>4</volume>
<elocation-id>642182</elocation-id>
<history>
<date date-type="received">
<day>15</day>
<month>12</month>
<year>2020</year>
</date>
<date date-type="accepted">
<day>02</day>
<month>08</month>
<year>2021</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2021 Huang, Kleindessner, Munishkin, Varshney, Guo and Wang.</copyright-statement>
<copyright-year>2021</copyright-year>
<copyright-holder>Huang, Kleindessner, Munishkin, Varshney, Guo and Wang</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these&#x20;terms.</p>
</license>
</permissions>
<abstract>
<p>The Arctic sea ice has retreated rapidly in the past few decades, which is believed to be driven by various dynamic and thermodynamic processes in the atmosphere. The newly open water resulting from sea ice decline in turn exerts large influence on the atmosphere. Therefore, this study aims to investigate the causality between multiple atmospheric processes and sea ice variations using three distinct data-driven causality approaches that have been proposed recently: Temporal Causality Discovery Framework (TCDF), Non-combinatorial Optimization <italic>via</italic> Trace Exponential and Augmented lagrangian for Structure learning (NOTEARS) and Directed Acyclic Graph-Graph Neural Networks (DAG-GNN). We apply these three algorithms to 39&#xa0;years of historical time-series data sets, which include 11 atmospheric variables from ERA-5 reanalysis product and passive microwave satellite retrieved sea ice extent. By comparing the causality graph results of these approaches with what we summarized from the literature, it shows that the static graphs produced by NOTEARS and DAG-GNN are relatively reasonable. The results from NOTEARS indicate that relative humidity and precipitation dominate sea ice changes among all variables, while the results from DAG-GNN suggest that the zonal and meridional wind are more important for driving sea ice variations. However, both approaches produce some unrealistic cause-effect relationships. Additionally, these three methods cannot well detect the delayed impact of one variable on another in the Arctic. It also turns out that the results are rather sensitive to the choice of hyperparameters of the three methods. As a pioneer study, this work paves the way to disentangle the complex causal relationships in the Earth system, by taking advantage of cutting-edge Artificial Intelligence technologies.</p>
</abstract>
<kwd-group>
<kwd>causality discovery</kwd>
<kwd>time series</kwd>
<kwd>arctic sea ice</kwd>
<kwd>temporal causality discovery framework</kwd>
<kwd>non-combinatorial optimization <italic>via</italic> trace exponential and augmented lagrangian for structure learning</kwd>
<kwd>directed acyclic graph-graph neural networks</kwd>
<kwd>atmosphere-sea ice interactions</kwd>
</kwd-group>
</article-meta>
</front>
<body>
<sec id="s1">
<title>1 Introduction</title>
<p>Warming in the Arctic has been much faster than in the rest of the world in both observations and model simulations, a phenomenon known as the Arctic amplification (<xref ref-type="bibr" rid="B34">Holland and Bitz, 2003</xref>; <xref ref-type="bibr" rid="B80">Serreze and Barry, 2011</xref>). Decline in sea ice has occurred in all seasons, which is believed to be the major driver of Arctic amplification. Over the last few decades, Arctic summer sea ice extent has declined by nearly 50% with accelerated retreat in the early 21st century (<xref ref-type="bibr" rid="B79">Serreze and Stroeve, 2015</xref>; <xref ref-type="bibr" rid="B82">Simmonds, 2015</xref>). These dramatic changes in the Arctic sea ice affect a growing community of diverse stakeholders. Accompanying this growing interest is an urgent demand to increase the pace and scope of the advancements in physical understanding and predictive capabilities. As one of the most important components in the Earth System, the atmosphere actively interacts with the sea ice underneath. On the one hand, the sea ice variations are caused by different dynamic and thermodynamic forcings. On the other hand, sea ice decline in turn exerts large influence on the atmosphere. This will further alter the climate patterns in both Arctic and mid-latitudes, which results in more frequent extreme weather events (<xref ref-type="bibr" rid="B17">Cohen et&#x20;al., 2014</xref>; <xref ref-type="bibr" rid="B83">Simmonds and Govekar, 2014</xref>; <xref ref-type="bibr" rid="B93">Sun et&#x20;al., 2016</xref>; <xref ref-type="bibr" rid="B105">Yao et&#x20;al., 2017</xref>; <xref ref-type="bibr" rid="B56">Luo et&#x20;al., 2018</xref>; <xref ref-type="bibr" rid="B55">Luo et&#x20;al., 2019a</xref>; <xref ref-type="bibr" rid="B57">Luo et&#x20;al., 2019b</xref>). These two-way feedbacks are potentially very important in terms of understanding the Arctic warming in the past and future. 
In most cases, these connections are highly nonlinear and conditionally constrained (e.g., differ by season or region), making them even more complex. For example, a link between recent winter sea ice decline and mid-latitude cold extremes could be mediated by whether there is a weak gradient of background potential vorticity (<xref ref-type="bibr" rid="B57">Luo et&#x20;al., 2019b</xref>; <xref ref-type="bibr" rid="B56">Luo et&#x20;al., 2018</xref>; <xref ref-type="bibr" rid="B55">Luo et&#x20;al., 2019a</xref>). Therefore, it is vital to analyze both the sea ice retreat&#x2019;s influence on the atmosphere and vice&#x20;versa.</p>
<p>The traditional way to discover causal relations is to manipulate the value of a variable by using interventions or real-life experiments. All other influencing factors of the target variable can be held fixed, to test whether a manipulation of a potential cause changes the target variable (<xref ref-type="bibr" rid="B62">Nauta et&#x20;al., 2019</xref>). Specifically, the typical approach for assessing causal links in climate study is targeted modeling experiments. Such experiments are often computationally expensive, time-consuming, or even impossible to carry out. More importantly, the large biases and substantial model spread remain in the state-of-the-art climate models (<xref ref-type="bibr" rid="B90">Stocker et&#x20;al., 2013</xref>), which further introduce some unrealistic causal relations. With the current advances in digital sensing and data assimilation, we have entered a period where Earth science tends to be data rich in observations (<xref ref-type="bibr" rid="B66">Overpeck et&#x20;al., 2011</xref>), allowing us to do data-driven causality discovery (<xref ref-type="bibr" rid="B29">Guo et&#x20;al., 2020</xref>; <xref ref-type="bibr" rid="B109">Zhang et&#x20;al., 2018</xref>; <xref ref-type="bibr" rid="B62">Nauta et&#x20;al., 2019</xref>). The data-driven causality approach aids scientists in identifying and extracting signals by analyzing statistical properties of purely observational data, which augments targeted model studies and has direct ties to forecasting and prediction. 
For time-series data, many popular data-driven causality frameworks are proposed such as Granger Causality (<xref ref-type="bibr" rid="B27">Granger, 1969</xref>), PC Momentary Conditional Independence (PCMCI) (<xref ref-type="bibr" rid="B72">Runge et&#x20;al., 2019</xref>), Time Series Models with Independent Noise (TiMINo) (<xref ref-type="bibr" rid="B69">Peters et&#x20;al., 2012</xref>), Additive Non-linear Time Series Model (ANLTSM) (<xref ref-type="bibr" rid="B16">Chu and Glymour, 2008</xref>) and time series Fast Causal Inference (tsFCI) (<xref ref-type="bibr" rid="B24">Entner and Hoyer, 2010</xref>). Several different frameworks for observational analysis have been applied to climate science to provide graphical representations of causal relations. For example, <xref ref-type="bibr" rid="B23">Ebert-Uphoff and Deng (2012)</xref> investigated causal relationships between four prominent modes of atmospheric low-frequency variability in boreal winter using Graphic Models. <xref ref-type="bibr" rid="B60">McGraw and Barnes (2018)</xref> highlighted the Granger Causality by a simple Monte Carlo example. More recently, <xref ref-type="bibr" rid="B88">Song et&#x20;al. (2018)</xref>, <xref ref-type="bibr" rid="B87">Song et&#x20;al. (2019)</xref> demonstrated the Granger causality between El Ni&#xf1;o and the southern oscillation (ENSO) and other climate variables. Some other applications in climate sciences include <xref ref-type="bibr" rid="B15">Chu et&#x20;al. (2005)</xref>; <xref ref-type="bibr" rid="B108">Zerenner et&#x20;al. (2014)</xref>; <xref ref-type="bibr" rid="B40">Hussung et&#x20;al. (2019)</xref>. 
Among them, the most relevant topic is the connections between Arctic and mid-latitude climate patterns, such as the Arctic drivers of mid-latitude winter circulations (<xref ref-type="bibr" rid="B50">Kretschmer et&#x20;al., 2016</xref>; <xref ref-type="bibr" rid="B73">Samarasinghe et&#x20;al., 2019</xref>) as well as the impacts of Arctic sea ice on circulations in the North Atlantic Ocean (<xref ref-type="bibr" rid="B91">Strong et&#x20;al., 2009</xref>) and Western Pacific (<xref ref-type="bibr" rid="B58">Matthewman and Magnusdottir, 2011</xref>). However, none of these studies investigates the relationship between sea ice retreat and the atmospheric dynamic and thermodynamic processes in the Arctic only, which is the focus of this study. It is unclear whether different causality approaches would produce similar results, or whether a particular technique is best suited for this topic as each study employs a different approach. Moreover, it is also valuable to evaluate whether these data-driven causality discovery approaches could capture those conditional and threshold-related connections.</p>
<p>Thus, the overarching goal of this study is to investigate the causality between multiple atmospheric processes and sea ice variations from sub-seasonal to seasonal timescales using data-driven causality approaches. Instead of performing multiple climate model simulations, here we focus solely on an observational-type analysis. Specifically, three distinct data-driven causality approaches, Temporal Causality Discovery Framework (TCDF) (<xref ref-type="bibr" rid="B62">Nauta et&#x20;al., 2019</xref>), Non-combinatorial Optimization via Trace Exponential and Augmented lagrangian for Structure learning (NOTEARS) (<xref ref-type="bibr" rid="B111">Zheng et&#x20;al., 2018</xref>) and Directed Acyclic Graph-Graph Neural Networks (DAG-GNN) (<xref ref-type="bibr" rid="B107">Yu et&#x20;al., 2019</xref>), will be used and compared to determine whether they are suitable for the particular climate study. The main reasons we chose these three approaches are: 1) the three approaches are relatively new (published in 2018 or later) and we have not seen studies applying or evaluating them with climate data; 2) both TCDF and DAG-GNN are deep learning based approaches and deep learning approaches normally can learn nonlinearity from datasets better than traditional machine learning approaches (<xref ref-type="bibr" rid="B74">Schmidhuber, 2015</xref>). Because DAG-GNN is built on top of NOTEARS for nonlinearity mapping, we included NOTEARS to see whether DAG-GNN can do better than NOTEARS for our dataset.</p>
<p>This paper is structured in the following sections. <xref ref-type="sec" rid="s2">Section 2</xref> summarizes the main conclusions from previous studies in terms of causal relations between different atmospheric processes and Arctic sea ice variations; <xref ref-type="sec" rid="s3">Section 3</xref> lists data sets and data pre-processing methods and steps; <xref ref-type="sec" rid="s4">Section 4</xref> introduces three data-driven causality discovery frameworks; <xref ref-type="sec" rid="s5">Section 5</xref> summarizes the results generated by each method and compares those results with a causality graph based on literature review. Finally, <xref ref-type="sec" rid="s6">Section 6</xref> reports the main conclusions and limitations of this&#x20;study.</p>
</sec>
<sec id="s2">
<title>2 Causality Between Atmospheric Processes and Arctic Sea Ice Variations</title>
<p>Due to the two-way interactions between the atmosphere and sea ice, studying causality between them is a challenging but important task, which makes it an area of high interest within the polar climate community. The sea ice variations can be caused by different dynamical and thermodynamical processes. Important dynamical processes include anomalous surface wind (<xref ref-type="bibr" rid="B89">Spreen et&#x20;al., 2011</xref>; <xref ref-type="bibr" rid="B103">Wu et&#x20;al., 2012</xref>), regional atmospheric circulation patterns (<xref ref-type="bibr" rid="B65">Overland and Wang, 2010</xref>; <xref ref-type="bibr" rid="B75">Screen et&#x20;al., 2018</xref>; <xref ref-type="bibr" rid="B71">Rinke et&#x20;al., 2019</xref>) and abnormal storm activities (<xref ref-type="bibr" rid="B81">Simmonds et&#x20;al., 2008</xref>; <xref ref-type="bibr" rid="B84">Simmonds and Keay, 2009</xref>; <xref ref-type="bibr" rid="B77">Screen et&#x20;al., 2011</xref>; <xref ref-type="bibr" rid="B86">Simmonds and Rudeva, 2012</xref>; <xref ref-type="bibr" rid="B67">Parkinson and Comiso, 2013</xref>; <xref ref-type="bibr" rid="B85">Simmonds and Rudeva, 2014</xref>). Cloud (<xref ref-type="bibr" rid="B43">Kapsch et&#x20;al., 2013</xref>), radiation (<xref ref-type="bibr" rid="B46">Kay and Gettelman, 2009</xref>; <xref ref-type="bibr" rid="B14">Choi et&#x20;al., 2014</xref>) and precipitation (<xref ref-type="bibr" rid="B7">Boisvert et&#x20;al., 2018</xref>; <xref ref-type="bibr" rid="B98">Wang et&#x20;al., 2019</xref>; <xref ref-type="bibr" rid="B114">Marcovecchio et al., 2021</xref>) are the important thermodynamic factors controlling Arctic sea ice trends and variability. 
On the other hand, sea ice decline in turn exerts large influence on the atmosphere, including cloud (<xref ref-type="bibr" rid="B46">Kay and Gettelman, 2009</xref>; <xref ref-type="bibr" rid="B61">Morrison et&#x20;al., 2018</xref>), surface energy budget (<xref ref-type="bibr" rid="B78">Semmler et&#x20;al., 2012</xref>; <xref ref-type="bibr" rid="B6">Boisvert et&#x20;al., 2015</xref>; <xref ref-type="bibr" rid="B5">Boisvert and Stroeve, 2015</xref>), precipitation (<xref ref-type="bibr" rid="B3">Bintanja and Selten, 2014</xref>; <xref ref-type="bibr" rid="B49">Kopec et&#x20;al., 2016</xref>) and large-scale circulation (<xref ref-type="bibr" rid="B12">Chemke et&#x20;al., 2019</xref>; <xref ref-type="bibr" rid="B47">Kennel and Yulaeva, 2020</xref>). <xref ref-type="fig" rid="F1">Figure&#x20;1</xref> depicts the causal relations between key atmospheric variables and sea ice over the Arctic. The sea ice here represents sea ice coverage and/or sea ice thickness. Note that the processes <italic>a</italic>&#x20;&#x2212; <italic>d</italic> are well-known atmospheric processes, including cloud microphysics, thermodynamics, radiation, climate dynamics, which have been studied over the past few decades. The processes <italic>e</italic>&#x20;&#x2212; <italic>i</italic> are summarized from more recent publications, which are still under investigation by climate scientists. We will explain processes <italic>e</italic>&#x20;&#x2212; <italic>i</italic> in detail in the next paragraph.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>The causality graph between key atmospheric variables and sea ice over the Arctic based on literature review. This graph represents the domain knowledge. Note that the processes <italic>a</italic>&#x20;&#x2212; <italic>d</italic> are well-known atmospheric processes, which can be summarized from multiple textbooks. The processes <italic>e</italic>&#x20;&#x2212; <italic>i</italic> are summarized from recent peer-reviewed publications and they are ongoing research. The <italic>sea</italic>_<italic>ice</italic> here represents sea ice coverage and/or sea ice thickness; <italic>GH</italic> is the geopotential height; <italic>RH</italic> is relative humidity; <italic>SLP</italic> means sea level pressure; <italic>u</italic>10<italic>m</italic> and <italic>v</italic>10<italic>m</italic> represent zonal and meridional wind at 10&#xa0;m, respectively; <italic>HFLX</italic> is the sensible plus latent heat flux; <italic>Precip</italic> is the total precipitation; <italic>CW</italic> is the total cloud water path; <italic>CC</italic> is the total cloud cover; <italic>SW</italic> and <italic>LW</italic> represent net shortwave and longwave flux at the surface, respectively.</p>
</caption>
<graphic xlink:href="fdata-04-642182-g001.tif"/>
</fig>
<p>The arrow <italic>e</italic> represents the two-way effect between sea ice and net longwave flux at the surface. Based on global reanalysis (<xref ref-type="bibr" rid="B43">Kapsch et&#x20;al., 2013</xref>; <xref ref-type="bibr" rid="B51">Lee et&#x20;al., 2017</xref>), surface (<xref ref-type="bibr" rid="B19">Cox et&#x20;al., 2016</xref>) and satellite observations (<xref ref-type="bibr" rid="B38">Huang et&#x20;al., 2017</xref>), as well as model simulations (<xref ref-type="bibr" rid="B42">Kapsch et&#x20;al., 2016</xref>; <xref ref-type="bibr" rid="B36">Huang et&#x20;al., 2019a</xref>), the downward longwave radiation at the surface dominates surface warming and therefore enhances sea ice melt in winter and spring. The increase in downward longwave flux is a result of an increase in cloudiness and moisture in the Arctic Basin, which is caused by enhanced local evaporation or moisture transport from mid-latitudes (<xref ref-type="bibr" rid="B54">Luo et&#x20;al., 2017</xref>). Positive anomalies of longwave flux in spring and early summer initiate an earlier melt onset, thereby triggering several feedback mechanisms which amplify melt during the succeeding months (<xref ref-type="bibr" rid="B42">Kapsch et&#x20;al., 2016</xref>; <xref ref-type="bibr" rid="B37">Huang et&#x20;al., 2019b</xref>). The sea ice melt increases the air temperature and thus increases the longwave flux at the surface. The downward shortwave flux, however, appears only important after the melt has started (<xref ref-type="bibr" rid="B43">Kapsch et&#x20;al., 2013</xref>; <xref ref-type="bibr" rid="B38">Huang et&#x20;al., 2017</xref>). 
Once the surface albedo is significantly reduced due to sea ice melt, the solar radiation could be absorbed by ocean, which further accelerates ice melt in late spring and summer (<xref ref-type="bibr" rid="B46">Kay and Gettelman, 2009</xref>; <xref ref-type="bibr" rid="B14">Choi et&#x20;al., 2014</xref>; <xref ref-type="bibr" rid="B42">Kapsch et&#x20;al., 2016</xref>). The feedback between surface net shortwave flux and sea ice, represented by arrow <italic>f</italic> in <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>, has been confirmed by both model simulations (<xref ref-type="bibr" rid="B42">Kapsch et&#x20;al., 2016</xref>) and satellite observations (<xref ref-type="bibr" rid="B46">Kay and Gettelman, 2009</xref>; <xref ref-type="bibr" rid="B64">Nussbaumer and Pinker, 2012</xref>; <xref ref-type="bibr" rid="B14">Choi et&#x20;al., 2014</xref>). The arrows <italic>g</italic> indicate the interactions between the sea ice variations and atmospheric dynamical processes. A series of studies demonstrated that recent loss of Arctic sea ice is triggered by the atmospheric circulation changes such as a tendency toward a dipole pattern in the mean sea level pressure trend with an increase over the Arctic Ocean and a decrease over Siberia. The Arctic dipole anomaly in summer (<xref ref-type="bibr" rid="B99">Wang et&#x20;al., 2009</xref>), winter (<xref ref-type="bibr" rid="B100">Watanabe et&#x20;al., 2006</xref>) and spring (<xref ref-type="bibr" rid="B44">Kapsch et&#x20;al., 2019</xref>) produces a strong meridional wind (v-component) anomaly that drives more sea ice out of the Arctic Ocean. In addition, this dipole anomaly promotes transport of heat and moisture and thus enhances downward longwave radiation and controls the melt onset (<xref ref-type="bibr" rid="B37">Huang et&#x20;al., 2019b</xref>; <xref ref-type="bibr" rid="B44">Kapsch et&#x20;al., 2019</xref>). 
Moreover, the changes in cyclone occurrence and/or depth during spring (<xref ref-type="bibr" rid="B77">Screen et&#x20;al., 2011</xref>) and summer (<xref ref-type="bibr" rid="B86">Simmonds and Rudeva, 2012</xref>) have preconditioning effects on the sea ice cover and exert a strong influence on the amount of sea ice that survives the melt season. A recent study also pointed out that a stronger anticyclonic circulation over Greenland and the Arctic Ocean in the troposphere may have contributed as much as 60% to the September sea ice extent decline since 1979, by warming and moistening the lower atmosphere (<xref ref-type="bibr" rid="B21">Ding et&#x20;al., 2017</xref>; <xref ref-type="bibr" rid="B112">Huang et al., 2021</xref>; <xref ref-type="bibr" rid="B113">Luo et al., 2021</xref>). On the other hand, the reduction in Arctic sea ice extent and increase in open water area in late summer are found to directly contribute to a modification of large-scale circulation patterns in the following autumn through the additional heat stored in the Arctic Ocean and released to the atmosphere during the autumn (<xref ref-type="bibr" rid="B65">Overland and Wang, 2010</xref>). The increased 1,000&#x2013;500&#xa0;hPa thickness in autumn produces an anomalous easterly zonal wind component (u-component), especially over the north of Alaska and Canada. Moreover, a more meridional flow pattern associated with sea ice reduction has an impact on the mid-latitude weather (<xref ref-type="bibr" rid="B65">Overland and Wang, 2010</xref>). These conclusions are mainly drawn from model simulations (<xref ref-type="bibr" rid="B100">Watanabe et&#x20;al., 2006</xref>; <xref ref-type="bibr" rid="B71">Rinke et&#x20;al., 2019</xref>), reanalysis and observations (<xref ref-type="bibr" rid="B99">Wang et&#x20;al., 2009</xref>; <xref ref-type="bibr" rid="B65">Overland and Wang, 2010</xref>; <xref ref-type="bibr" rid="B44">Kapsch et&#x20;al., 2019</xref>). 
In addition to radiation, the sensible plus latent heat flux also plays an important role in the Arctic energy budget. The increase in the downward moisture flux triggers the melting of the sea ice in spring (<xref ref-type="bibr" rid="B6">Boisvert et&#x20;al., 2015</xref>; <xref ref-type="bibr" rid="B5">Boisvert and Stroeve, 2015</xref>; <xref ref-type="bibr" rid="B114">Marcovecchio et al., 2021</xref>). Earlier melt onset and loss of sea ice in the spring enhance warming of the ice-free ocean surface, which in turn leads to an increase of evaporation from the surface into the atmosphere in the autumn. This positive feedback between heat flux and sea ice, indicated by arrow <italic>h</italic>, has been confirmed by satellite observations (<xref ref-type="bibr" rid="B6">Boisvert et&#x20;al., 2015</xref>; <xref ref-type="bibr" rid="B5">Boisvert and Stroeve, 2015</xref>) and model simulations (<xref ref-type="bibr" rid="B36">Huang et&#x20;al., 2019a</xref>) during most months of the year. The arrow <italic>i</italic> represents the influence of precipitation on Arctic sea ice variations. Specifically, the magnitude of precipitation accumulating over the sea ice pack largely determines the depth of the snow layer, which modulates the rate of sea ice growth because of its highly insulating properties (<xref ref-type="bibr" rid="B92">Sturm et&#x20;al., 2002</xref>). The phase of the precipitation falling on the sea ice pack is also important. As rain, it can melt, compact, and densify the snowpack, thus reducing the surface albedo and promoting sea ice melt (<xref ref-type="bibr" rid="B68">Perovich et&#x20;al., 2002</xref>). The recent snowfall decline in summer is essentially caused by changes in precipitation form (snow turning to rain) with very little influence of decreases in total precipitation, which is a result of lower-atmospheric warming. 
Then the loss of snow-on-ice results in a substantial decrease in the surface albedo over the Arctic Ocean, causing additional surface ice melt by absorbing more solar radiation (<xref ref-type="bibr" rid="B76">Screen and Simmonds, 2012</xref>). These conclusions are mainly drawn from <italic>in-situ</italic> measurements during field campaign (<xref ref-type="bibr" rid="B68">Perovich et&#x20;al., 2002</xref>; <xref ref-type="bibr" rid="B92">Sturm et&#x20;al., 2002</xref>), global reanalysis products and surface observations (<xref ref-type="bibr" rid="B76">Screen and Simmonds, 2012</xref>; <xref ref-type="bibr" rid="B7">Boisvert et&#x20;al., 2018</xref>; <xref ref-type="bibr" rid="B98">Wang et&#x20;al., 2019</xref>). The higher precipitation and snowfall could result in a thicker snowpack that allows less heat loss to the atmosphere. More importantly, modeling studies suggest that increases in Arctic precipitation over the 21st century, particularly in late autumn and winter, are due mainly to strongly intensified local surface evaporation (latent heat flux) (<xref ref-type="bibr" rid="B3">Bintanja and Selten, 2014</xref>). Therefore, we believe that Arctic precipitation exerts direct influence on sea ice variations (arrow <italic>i</italic>), while sea ice modulates precipitation mainly through sensible plus latent heat flux (arrows <italic>h</italic>,&#x20;<italic>b</italic>).</p>
<p>Among these studies, very few of them have demonstrated the delayed impact of one variable on another. Specifically, the net shortwave flux at the surface in early summer (May&#x2013;July) is found to enhance sea ice melt with a lag of 1&#x2013;4&#xa0;months (<xref ref-type="bibr" rid="B14">Choi et&#x20;al., 2014</xref>). Moreover, the sea ice condition exhibits delayed impacts on itself, which is called sea ice anomaly persistence (<xref ref-type="bibr" rid="B28">Guemas et&#x20;al., 2016</xref>; <xref ref-type="bibr" rid="B20">Cruz-Garc&#xed;a et&#x20;al., 2019</xref>; <xref ref-type="bibr" rid="B35">Holland et&#x20;al., 2019</xref>). The sea ice anomaly persistence depends on the predictand (area, extent, volume), region, and the initial and target dates, and can vary from a few days to a few years (<xref ref-type="bibr" rid="B28">Guemas et&#x20;al., 2016</xref>). With sea ice anomaly persistence, there is predictability for the sea ice area in winter but low predictability throughout the rest of the year in peripheral seas. Based on multiple model simulations, the Labrador Sea stands out among the considered regions, with sea ice predictability extending up to 1.5&#xa0;years (<xref ref-type="bibr" rid="B20">Cruz-Garc&#xed;a et&#x20;al., 2019</xref>).</p>
<p>Note that most of studies mentioned above determine the changes in one variable, happening before another one, by applying time series analysis and/or composite analysis based on observations, reanalysis or model output (<xref ref-type="bibr" rid="B68">Perovich et&#x20;al., 2002</xref>; <xref ref-type="bibr" rid="B92">Sturm et&#x20;al., 2002</xref>; <xref ref-type="bibr" rid="B46">Kay and Gettelman, 2009</xref>; <xref ref-type="bibr" rid="B99">Wang et&#x20;al., 2009</xref>; <xref ref-type="bibr" rid="B64">Nussbaumer and Pinker, 2012</xref>; <xref ref-type="bibr" rid="B43">Kapsch et&#x20;al., 2013</xref>; <xref ref-type="bibr" rid="B14">Choi et&#x20;al., 2014</xref>; <xref ref-type="bibr" rid="B6">Boisvert et&#x20;al., 2015</xref>; <xref ref-type="bibr" rid="B5">Boisvert and Stroeve, 2015</xref>; <xref ref-type="bibr" rid="B19">Cox et&#x20;al., 2016</xref>; <xref ref-type="bibr" rid="B38">Huang et&#x20;al., 2017</xref>; <xref ref-type="bibr" rid="B37">Huang et&#x20;al., 2019b</xref>; <xref ref-type="bibr" rid="B7">Boisvert et&#x20;al., 2018</xref>; <xref ref-type="bibr" rid="B98">Wang et&#x20;al., 2019</xref>). Among them, some studies use more advanced statistical analysis such as empirical orthogonal function (<xref ref-type="bibr" rid="B100">Watanabe et&#x20;al., 2006</xref>; <xref ref-type="bibr" rid="B65">Overland and Wang, 2010</xref>) and self-organizing map (<xref ref-type="bibr" rid="B44">Kapsch et&#x20;al., 2019</xref>; <xref ref-type="bibr" rid="B71">Rinke et&#x20;al., 2019</xref>). 
Other studies assess the causal links through targeted modeling experiments (<xref ref-type="bibr" rid="B3">Bintanja and Selten, 2014</xref>; <xref ref-type="bibr" rid="B42">Kapsch et&#x20;al., 2016</xref>; <xref ref-type="bibr" rid="B21">Ding et&#x20;al., 2017</xref>; <xref ref-type="bibr" rid="B36">Huang et&#x20;al., 2019a</xref>; <xref ref-type="bibr" rid="B20">Cruz-Garc&#xed;a et&#x20;al., 2019</xref>), in order to test whether a manipulation of one variable has an impact on others. Moreover, most of the studies focus on relationships between only one or two atmospheric processes and changes in Arctic sea ice. Therefore, in this study, we aim to provide a more comprehensive analysis of causality between multiple atmospheric processes and sea ice by applying different data-driven causality approaches.</p>
</sec>
<sec id="s3">
<title>3 Data Sets and Data Pre-processing</title>
<p>In this study, we use the total sea ice extent as the Arctic sea ice index. The sea ice extent is defined as the total area in the Arctic with sea ice concentration greater than 15%. The conversion from sea ice concentration to sea ice extent was conducted at a daily time scale. Therefore, we obtained the sea ice concentration from the Nimbus-7 SMMR and DMSP SSM/I-SSMIS passive microwave data version 1 (<xref ref-type="bibr" rid="B11">Cavalieri et&#x20;al., 1996</xref>) provided by the National Snow and Ice Data Center. This dataset was generated from brightness temperature data, and provided daily in the polar stereographic projection with a grid box of 25&#xa0;km &#xd7; 25&#xa0;km since October 1978. The uncertainty of sea ice concentration over the Arctic is within &#xb1;5<italic>%</italic> during the winter, when the sea ice is relatively thick and the sea ice concentration is high. During the summer, the uncertainty increases to &#xb1;15<italic>%</italic> when the melt ponds are present (<xref ref-type="bibr" rid="B10">Cavalieri et&#x20;al., 1992</xref>).</p>
<p>The atmospheric variables were obtained from the ERA-5 global reanalysis product. ERA-5 was produced using 4D-Var data assimilation in CY41R2 of the European Centre for Medium-Range Weather Forecasts (ECMWF)&#x2019;s Integrated Forecast System (IFS), with 137 hybrid sigma/pressure (model) levels in the vertical, with the top level at 0.01&#xa0;hPa (<xref ref-type="bibr" rid="B32">Hersbach et&#x20;al., 2020</xref>). The ERA-5 reanalysis has been evaluated over the Arctic in previous studies and it stands out among several global reanalysis products (<xref ref-type="bibr" rid="B26">Graham et&#x20;al., 2019</xref>; <xref ref-type="bibr" rid="B59">Mayer et&#x20;al., 2019</xref>) as being more consistent with independent observations (<xref ref-type="bibr" rid="B32">Hersbach et&#x20;al., 2020</xref>), which lends credence to the results obtained here in connection with the associations between the variables considered. In this study, the variables used in the causality discovery algorithms are listed in <xref ref-type="table" rid="T1">Table&#x20;1</xref>. For three-dimensional data (geopotential heights and relative humidity), we treat each as a single variable because we would like to filter out the connections between different layers for each variable. The air temperature has been excluded in this study because it exhibits very high correlation with sea ice concentration. The interactions between air temperature and sea ice could be dominant over all other atmospheric processes based on our&#x20;tests.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>The atmospheric and sea ice variables considered in this&#x20;study.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Abbrev. in <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>
</th>
<th align="center">Variable</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">GH</td>
<td align="center">Geopotential heights averaged from 200&#xa0;hPa, 500&#xa0;hPa, and 850&#xa0;hPa</td>
</tr>
<tr>
<td align="left">RH</td>
<td align="center">Relative humidity averaged from 1,000&#x2013;300&#xa0;hPa</td>
</tr>
<tr>
<td align="left">SLP</td>
<td align="center">Sea level pressure</td>
</tr>
<tr>
<td align="left">u10&#xa0;m</td>
<td align="center">Zonal (u-component) wind at 10&#xa0;m</td>
</tr>
<tr>
<td align="left">v10&#xa0;m</td>
<td align="center">Meridional (v-component) wind at 10&#xa0;m</td>
</tr>
<tr>
<td align="left">HFLX</td>
<td align="center">Sensible plus latent heat flux</td>
</tr>
<tr>
<td align="left">Precip</td>
<td align="center">Total precipitation</td>
</tr>
<tr>
<td align="left">CC</td>
<td align="center">Total cloud cover</td>
</tr>
<tr>
<td align="left">CW</td>
<td align="center">Total cloud water path</td>
</tr>
<tr>
<td align="left">SW</td>
<td align="center">Net shortwave flux at the surface</td>
</tr>
<tr>
<td align="left">LW</td>
<td align="center">Net longwave flux at the surface</td>
</tr>
<tr>
<td align="left">Sea_ice</td>
<td align="center">Sea ice extent in the Northern Hemisphere</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>All monthly gridded data during 1980&#x2013;2018 have been averaged over the Arctic north of 60&#xb0;N (<xref ref-type="fig" rid="F2">Figure&#x20;2</xref>) using area-weighted method. Therefore, we created the time-series for both sea ice extent and atmospheric variables. We believe that 39&#xa0;years of data should be sufficient to derive causal relationships and draw meaningful conclusions. In addition, most of the observational-based climate studies mentioned in <xref ref-type="fig" rid="F1">Figure&#x20;1</xref> used the data during the modern satellite era (1979-present), which is consistent with our studies. Our purpose is to match this time period and to determine whether those algorithms can produce similar results. Under the background of global warming, almost all components in the Earth System changed with time, as a response to increased greenhouse gas emissions. Regressing atmospheric responses against sea ice decline (or the other way around) involves the risk of finding potentially spurious atmosphere-sea ice interactions simply because both variables change across years (<xref ref-type="bibr" rid="B41">Iler et&#x20;al., 2017</xref>). Therefore, it is necessary to detrend the time-series as the climate data is normally nonlinear and nonstationary (<xref ref-type="bibr" rid="B104">Wu et&#x20;al., 2007</xref>). This technique has been widely used in previous climate studies (<xref ref-type="bibr" rid="B101">Weber and Talkner, 2001</xref>; <xref ref-type="bibr" rid="B45">Kawale et&#x20;al., 2013</xref>), including several recent studies about atmosphere-sea ice interactions in the Arctic (<xref ref-type="bibr" rid="B21">Ding et&#x20;al., 2017</xref>; <xref ref-type="bibr" rid="B38">Huang et&#x20;al., 2017</xref>; <xref ref-type="bibr" rid="B2">Baxter et&#x20;al., 2019</xref>; <xref ref-type="bibr" rid="B96">Top&#xe1;l et&#x20;al., 2020</xref>). 
Moreover, detrending for time-series that is nonstationary is also important in causality discovery methods (<xref ref-type="bibr" rid="B27">Granger, 1969</xref>; <xref ref-type="bibr" rid="B24">Entner and Hoyer, 2010</xref>; <xref ref-type="bibr" rid="B69">Peters et&#x20;al., 2012</xref>; <xref ref-type="bibr" rid="B72">Runge et&#x20;al., 2019</xref>). Thus, in order to eliminate overall impacts of global warming and seasonality during this 39-year time period, we applied detrending and deseasonalizing for each time-series. Note that we also conducted additional analysis with raw data to show how detrending and deseasonalizing have an impact on our results at the end of <xref ref-type="sec" rid="s5">Section&#x20;5</xref>.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>The study area (60&#xb0;N northward). The circle of 60&#xb0;N is marked in red. Depending on the season, sea ice could occur south of 60&#xb0;N.</p>
</caption>
<graphic xlink:href="fdata-04-642182-g002.tif"/>
</fig>
<p>Here we assume the time series is additive and there exist both trend and seasonal components, that is<disp-formula id="e1">
<mml:math id="m1">
<mml:msub>
<mml:mrow>
<mml:mi>X</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>m</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>s</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>Y</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>.</mml:mo>
</mml:math>
<label>(1)</label>
</disp-formula>Here, the <italic>m</italic>
<sub>
<italic>t</italic>
</sub> indicates the trend component, while the <italic>s</italic>
<sub>
<italic>t</italic>
</sub> represents the seasonality component. The time series has been detrended by subtracting the line of best fit <italic>m</italic>
<sub>
<italic>t</italic>
</sub> from the time-series, where the line of best fit was obtained from a linear regression model with the time steps as the predictor. To deseasonalize the time-series, we used the averaged seasonal index <italic>s</italic>
<sub>
<italic>t</italic>
</sub> to seasonally adjust the data. The seasonal indices were calculated from moving averages with a 12-month seasonal window in this study (<xref ref-type="bibr" rid="B30">Hamilton, 1994</xref>). More details about time series decomposition can be found in <xref ref-type="bibr" rid="B8">Brockwell et&#x20;al. (2016)</xref>. At the end, we only kept the residual component <italic>Y</italic>
<sub>
<italic>t</italic>
</sub>, which fluctuates around zero, that is<disp-formula id="e2">
<mml:math id="m2">
<mml:mi>E</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>Y</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>0</mml:mn>
<mml:mo>.</mml:mo>
</mml:math>
<label>(2)</label>
</disp-formula>Then we normalized <italic>Y</italic>
<sub>
<italic>t</italic>
</sub> using the max-min method so that<disp-formula id="e3">
<mml:math id="m3">
<mml:msub>
<mml:mrow>
<mml:mi>Y</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2208;</mml:mo>
<mml:mrow>
<mml:mo stretchy="false">[</mml:mo>
<mml:mrow>
<mml:mn>0</mml:mn>
<mml:mo>,</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mo stretchy="false">]</mml:mo>
</mml:mrow>
<mml:mo>.</mml:mo>
</mml:math>
<label>(3)</label>
</disp-formula>
</p>
</sec>
<sec id="s4">
<title>4&#x20;Data-Driven Causality Discovery Algorithms</title>
<p>In this work, we apply data-driven causal discovery algorithms aiming to find the major causes of the decrease of Arctic sea ice. These algorithms typically assume that one process or state, a cause, contributes to the production of another process or state, an effect. The cause is assumed to be partly responsible for the effect, and the effect is partly dependent on the cause, although the effect does not necessarily exert a reverse influence on the cause. Thus, causal discovery aims to discover direct cause-effect relationships for both instantaneous and delayed causes. Here we will investigate three recently proposed causal discovery algorithms: TCDF (<xref ref-type="bibr" rid="B62">Nauta et&#x20;al., 2019</xref>), NOTEARS (<xref ref-type="bibr" rid="B111">Zheng et&#x20;al., 2018</xref>), and DAG-GNN (<xref ref-type="bibr" rid="B107">Yu et&#x20;al., 2019</xref>). The overall framework of our benchmarking pipeline is shown in <xref ref-type="fig" rid="F3">Figure&#x20;3</xref>. We believe this general framework can help researchers to evaluate their causality discovery approaches in sea ice study and Earth science in general.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>The framework of benchmarking causality discovery methods in atmosphere-sea ice study. Note that detrending and deseasonalizing time-series is optional during the input data pre-processing process.</p>
</caption>
<graphic xlink:href="fdata-04-642182-g003.tif"/>
</fig>
<sec id="s4-1">
<title>4.1 Temporal Causality Discovery Framework</title>
<p>The TCDF algorithm (<xref ref-type="bibr" rid="B62">Nauta et&#x20;al., 2019</xref>) is based on attention-based (<xref ref-type="bibr" rid="B106">Yin et&#x20;al., 2016</xref>) Convolutional Neural Networks (CNN). The input to the algorithm is time series data and the output is a causality graph structure with time delay or lag, which is automatically determined by the TCDF algorithm. For our climate sciences problem with data shown in <xref ref-type="table" rid="T1">Table&#x20;1</xref>, the TCDF algorithm takes the measured data of sea ice, relative humidity, and other atmospheric processes (<xref ref-type="table" rid="T1">Table&#x20;1</xref>) in order to build a causality graph describing how the input variables interact with each other. <xref ref-type="fig" rid="F4">Figure&#x20;4</xref> illustrates the architecture of the TCDF method, operating on generic data, where the multi-dimensional time-series data is on the left and the produced causality graph is on the right. There are four steps to learn a Temporal Causal Graph from the time-series data: Time Series Prediction block, Attention Interpretation block, Causal Validation and Delay Discovery blocks as explained in detail in <xref ref-type="bibr" rid="B62">Nauta et&#x20;al. (2019)</xref>. Here we explain the general process of the TCDF algorithm; a more in-depth description is given in Section 4 of <xref ref-type="bibr" rid="B62">Nauta et&#x20;al. (2019)</xref>. The first step is that the time-series data is fed into the Time Series Prediction block, which tries to create an internal time-series model that accurately represents each atmospheric or atmosphere-sea ice process. Then the Attention Interpretation block takes that hidden model produced by the Time Series Prediction block and tries to verify and validate how accurate the prediction is to the actual data. 
Then the last two blocks again verify the hidden model from the Time Series Prediction block but now using the verification errors from the Attention Interpretation block in parallel. The two last blocks try to verify the causal and time delay relationships generated from the prediction block with errors generated by the attention block. A detailed explanation is provided in <xref ref-type="bibr" rid="B62">Nauta et&#x20;al. (2019)</xref> and more details on attention-based CNN can be found in <xref ref-type="bibr" rid="B106">Yin et&#x20;al. (2016)</xref>. Also as a side note: for multi-dimensional time-series there are <italic>n</italic> independent attention-based CNNs, all with the same architecture for each time-series&#x20;data.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Architecture of TCDF (<xref ref-type="bibr" rid="B62">Nauta et&#x20;al., 2019</xref>). The figure is an illustrative example of a high level view of how TCDF creates a causal discovery graph with delays (numbers on the edges of the graph) from time-series&#x20;data.</p>
</caption>
<graphic xlink:href="fdata-04-642182-g004.tif"/>
</fig>
<p>The basic structure of TCDF is for time-series prediction as seen in the first step of the framework in <xref ref-type="fig" rid="F4">Figure&#x20;4</xref>. After predicting time-series, the output gives attention scores for the attention interpretation mechanism. Attention CNNs (<xref ref-type="bibr" rid="B106">Yin et&#x20;al., 2016</xref>) is a machine learning method based on using neural networks to help optimize internal automatically picked parameters in the hidden model generated in our case from the Time Series block. In other words, it is a form of self-learning or adaptive optimization (<xref ref-type="bibr" rid="B25">Eveleigh, 1967</xref>; <xref ref-type="bibr" rid="B102">Wei, 2018</xref>) applied to machine learning. The causality validation reads the final result of the attention scores and applies a permutation importance validation method. The permutation importance is a measurement of how much an error will affect the values of a certain attention score when all scores are randomly permuted. The idea is that permuting a time-series attention score removes potential cause and effect relationships and hence the method can detect real versus fake causal relationships. In parallel the attention scores are fed to the delay discovery to learn the potential delay in cause and effect relationships. The delay discovery also employs the permutation importance validation method.</p>
<p>Another major advantage of TCDF is in using a CNN versus a traditional Recurrent Neural Network (RNN), such as a Long Short Term Memory (LSTM), for time-series data. The advantage is that RNNs typically have a vanishing gradient problem: long-term information has to sequentially travel through all the cells before getting to the present processing cell and typically stalls the learning processes, sometimes even preventing any further improvements gained with learning with more data (<xref ref-type="bibr" rid="B33">Hochreiter, 1998</xref>; <xref ref-type="bibr" rid="B94">Tan and Lim, 2019</xref>). This is greatly amplified when the number of layers becomes very deep, typically more than 10 layers (<xref ref-type="bibr" rid="B74">Schmidhuber, 2015</xref>). Though a CNN structure might have this problem as well, it is more common in RNN because it typically needs much more memory and cells than a CNN structure. With more cells to process, there is a greater chance of obtaining the vanishing gradient problem.</p>
</sec>
<sec id="s4-2">
<title>4.2&#x20;Non-combinatorial Optimization <italic>via</italic> Trace Exponential and Augmented Lagrangian for Structure Learning</title>
<p>The NOTEARS algorithm (<xref ref-type="bibr" rid="B111">Zheng et&#x20;al., 2018</xref>) assumes a linear data generating model of the form<disp-formula id="e4">
<mml:math id="m4">
<mml:msub>
<mml:mrow>
<mml:mi>X</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:munder>
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>:</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>W</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2260;</mml:mo>
<mml:mn>0</mml:mn>
</mml:mrow>
</mml:munder>
<mml:msub>
<mml:mrow>
<mml:mi>W</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:msub>
<mml:mrow>
<mml:mi>X</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>N</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
</mml:math>
<label>(4)</label>
</disp-formula>where <italic>W</italic> is the weighted adjacency matrix of the underlying causality graph <italic>G</italic>(<italic>W</italic>), that is <italic>j</italic>&#x20;&#x2192; <italic>i</italic> in <italic>G</italic>(<italic>W</italic>) if and only if <italic>W</italic>
<sub>
<italic>ji</italic>
</sub> &#x2260; 0, and the random variables <italic>N</italic>
<sub>
<italic>i</italic>
</sub> are independent noise variables. Given <italic>n</italic> independent and identically distributed (i.i.d.) observations of the variables <italic>X</italic>
<sub>1</sub>, &#x2026; , <italic>X</italic>
<sub>
<italic>d</italic>
</sub>, written as matrix <bold>X</bold> &#x2208; &#x211d;<sup>
<italic>n</italic>&#xd7;<italic>d</italic>
</sup>, a standard estimator for <italic>W</italic> is the (regularized) least-squares estimator<disp-formula id="e5">
<mml:math id="m5">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>W</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x005E;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mi>arg</mml:mi>
<mml:munder>
<mml:mrow>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi>min</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>W</mml:mi>
<mml:mo>&#x2208;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mi>&#x211d;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>d</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>d</mml:mi>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:munder>
<mml:mfrac>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:mo stretchy="false">&#x2016;</mml:mo>
<mml:mi mathvariant="bold">X</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mi mathvariant="bold">X</mml:mi>
<mml:mi>W</mml:mi>
<mml:msubsup>
<mml:mrow>
<mml:mo stretchy="false">&#x2016;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>F</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>&#x3bb;</mml:mi>
<mml:mo stretchy="false">&#x2016;</mml:mo>
<mml:mi>W</mml:mi>
<mml:msub>
<mml:mrow>
<mml:mo stretchy="false">&#x2016;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mspace width="1em"/>
<mml:mtext>subject&#x2009;to&#x2009;</mml:mtext>
<mml:mi>G</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>W</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mtext>&#x2009;is&#x2009;a&#x2009;DAG</mml:mtext>
<mml:mo>,</mml:mo>
</mml:math>
<label>(5)</label>
</disp-formula>where <italic>&#x3bb;</italic> &#x2265; 0 is the regularization parameter. This estimator is theoretically well-studied and satisfies desirable properties such as consistency (<xref ref-type="bibr" rid="B97">Van de Geer and B&#xfc;hlmann, 2013</xref>; <xref ref-type="bibr" rid="B53">Loh and B&#xfc;hlmann, 2014</xref>; <xref ref-type="bibr" rid="B1">Aragam et&#x20;al., 2017</xref>). However, due to the non-convex, <italic>combinatorial-like</italic> constraint, optimization problems of the form <xref ref-type="disp-formula" rid="e5">Eq. 5</xref> are NP-hard to solve (<xref ref-type="bibr" rid="B13">Chickering, 1996</xref>), and hence unless the number of variables <italic>d</italic> is very small, heuristics such as local search have to be applied (e.g., <xref ref-type="bibr" rid="B31">Heckerman et&#x20;al., 1995</xref>; <xref ref-type="bibr" rid="B70">Ramsey et&#x20;al., 2017</xref>). The NOTEARS algorithm builds on the insight that<disp-formula id="e6">
<mml:math id="m6">
<mml:mtext>G</mml:mtext>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mtext>W</mml:mtext>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mtext>&#x2009;is&#x2009;a&#x2009;DAG</mml:mtext>
<mml:mspace width="0.3333em" class="nbsp"/>
<mml:mspace width="0.3333em" class="nbsp"/>
<mml:mo>&#x21d4;</mml:mo>
<mml:mspace width="0.3333em" class="nbsp"/>
<mml:mspace width="0.3333em" class="nbsp"/>
<mml:mtext>trace</mml:mtext>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>exp</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>W</mml:mi>
<mml:mo>&#x25e6;</mml:mo>
<mml:mi>W</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>d</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>0</mml:mn>
<mml:mo>,</mml:mo>
</mml:math>
<label>(6)</label>
</disp-formula>where exp denotes the matrix exponential and &#x25e6; the element-wise product. The characterization in <xref ref-type="disp-formula" rid="e6">Eq. 6</xref> allows us to treat the optimization problem <xref ref-type="disp-formula" rid="e5">Eq. 5</xref> as an ordinary <italic>continuous</italic> constrained optimization problem and to use any algorithm from the rich literature on continuous optimization to find a locally optimal solution to <xref ref-type="disp-formula" rid="e5">Eq. 5</xref>. Concretely, the NOTEARS algorithm applies the augmented Lagrangian method (e.g., <xref ref-type="bibr" rid="B63">Nocedal and Wright, 2006</xref>) to search for a locally optimal solution to<disp-formula id="e7">
<mml:math id="m7">
<mml:mi>arg</mml:mi>
<mml:munder>
<mml:mrow>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi>min</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>W</mml:mi>
<mml:mo>&#x2208;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mi>&#x211d;</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>d</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>d</mml:mi>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:munder>
<mml:mfrac>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
<mml:mi>n</mml:mi>
</mml:mrow>
</mml:mfrac>
<mml:mo stretchy="false">&#x2016;</mml:mo>
<mml:mi mathvariant="bold">X</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mi mathvariant="bold">X</mml:mi>
<mml:mi>W</mml:mi>
<mml:msubsup>
<mml:mrow>
<mml:mo stretchy="false">&#x2016;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>F</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msubsup>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>&#x3bb;</mml:mi>
<mml:mo stretchy="false">&#x2016;</mml:mo>
<mml:mi>W</mml:mi>
<mml:msub>
<mml:mrow>
<mml:mo stretchy="false">&#x2016;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mspace width="1em"/>
<mml:mtext>subject&#x2009;to&#x2009;trace </mml:mtext>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>exp</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>W</mml:mi>
<mml:mo>&#x25e6;</mml:mo>
<mml:mi>W</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>d</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>0</mml:mn>
<mml:mo>.</mml:mo>
</mml:math>
<label>(7)</label>
</disp-formula>After applying the augmented Lagrangian method to (7) and obtaining an output <inline-formula id="inf1">
<mml:math id="m8">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>W</mml:mi>
</mml:mrow>
<mml:mo>&#x303;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula>, the final step of the NOTEARS algorithm is to &#x201c;round&#x201d; <inline-formula id="inf2">
<mml:math id="m9">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>W</mml:mi>
</mml:mrow>
<mml:mo>&#x303;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula> and to set&#x20;all entries of <inline-formula id="inf3">
<mml:math id="m10">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>W</mml:mi>
</mml:mrow>
<mml:mo>&#x303;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula> with absolute value smaller than some threshold <italic>t</italic> to zero. This yields the final output <inline-formula id="inf4">
<mml:math id="m11">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>W</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x005E;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula> of the NOTEARS algorithm.</p>
<p>In summary, the NOTEARS algorithm yields an estimate of the underlying causality graph as well as the strengths of the causal relationships. It does so by assuming a linear data generating model and access to i.i.d. observations and fitting a causal graph to the data. Its advantage over existing approaches is that it formulates the fitting problem in a way that makes it amenable to standard algorithms for continuous optimization. However, in general, the NOTEARS algorithm will still return only a locally optimal solution to the fitting problem, and the assumption of a linear data generating model might restrict its applicability.</p>
</sec>
<sec id="s4-3">
<title>4.3 Directed Acyclic Graph-Graph Neural Networks</title>
<p>DAG-GNN (<xref ref-type="bibr" rid="B107">Yu et&#x20;al., 2019</xref>) can be thought of as an extension to the NOTEARS algorithm (<xref ref-type="bibr" rid="B111">Zheng et&#x20;al., 2018</xref>) in that the proposed method assumes a nonlinear model of the form<disp-formula id="e8">
<mml:math id="m12">
<mml:mi>X</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>f</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>I</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mi>A</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
</mml:mrow>
</mml:msup>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msup>
<mml:msub>
<mml:mrow>
<mml:mi>f</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>Z</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>,</mml:mo>
</mml:math>
<label>(8)</label>
</disp-formula>where <italic>Z</italic> is the encoded latent variable of <italic>X</italic>. This can be contrasted to the linear model assumed in NOTEARS<disp-formula id="e9">
<mml:math id="m13">
<mml:mi>X</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>I</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mi>A</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
</mml:mrow>
</mml:msup>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msup>
<mml:mi>Z</mml:mi>
<mml:mo>,</mml:mo>
</mml:math>
<label>(9)</label>
</disp-formula>where <xref ref-type="disp-formula" rid="e9">Eq. 9</xref> is a restructured form of <xref ref-type="disp-formula" rid="e4">Eq. 4</xref>. Further, DAG-GNN builds an inference model to encode <italic>Z</italic>, given by<disp-formula id="e10">
<mml:math id="m14">
<mml:mi>Z</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>f</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>4</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>I</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mi>A</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>T</mml:mi>
</mml:mrow>
</mml:msup>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>f</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>3</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>X</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>,</mml:mo>
</mml:math>
<label>(10)</label>
</disp-formula>where <italic>f</italic>
<sub>3</sub> and <italic>f</italic>
<sub>4</sub> play a conceptually inverse role for <italic>f</italic>
<sub>2</sub> and <italic>f</italic>
<sub>1</sub> respectively. In particular, this paper assumes <italic>f</italic>
<sub>1</sub>, <italic>f</italic>
<sub>4</sub> to be identity functions and <italic>f</italic>
<sub>2</sub>, <italic>f</italic>
<sub>3</sub> as Multilayer Perceptrons (MLP). Multilayer Perceptrons are feed-forward Artificial Neural Networks with multiple hidden layers. They are trained through stochastic gradient descent and backpropagation and their function (<italic>f</italic>
<sub>2</sub> and <italic>f</italic>
<sub>3</sub> in our case) corresponds to the relation between the input and output variables.</p>
<p>Since an MLP is nonlinear, it should in theory capture any nonlinearities in the data better than NOTEARS which is a linear model. This is further explained in <xref ref-type="fig" rid="F5">Figure&#x20;5</xref> where <inline-formula id="inf5">
<mml:math id="m15">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>X</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula> is the regenerated form of <italic>X</italic> and MLP has one hidden layer of 64 neurons. Further, DAG-GNN minimizes the following loss function.<disp-formula id="e11">
<mml:math id="m16">
<mml:mtable class="align" columnalign="left">
<mml:mtr>
<mml:mtd columnalign="right">
<mml:munder>
<mml:mrow>
<mml:mi>min</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>A</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>&#x3b8;</mml:mi>
</mml:mrow>
</mml:munder>
</mml:mtd>
<mml:mtd columnalign="left">
<mml:mi>f</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>A</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>&#x3b8;</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mo>&#x2212;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>L</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>E</mml:mi>
<mml:mi>L</mml:mi>
<mml:mi>B</mml:mi>
<mml:mi>O</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:math>
<label>(11)</label>
</disp-formula>
<disp-formula id="e12">
<mml:math id="m17">
<mml:mtable class="align" columnalign="left">
<mml:mtr>
<mml:mtd columnalign="right">
<mml:mtext>s.t.&#x2009;</mml:mtext>
</mml:mtd>
<mml:mtd columnalign="left">
<mml:mi>h</mml:mi>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>A</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mtext>tr</mml:mtext>
<mml:mrow>
<mml:mo stretchy="false">[</mml:mo>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:mi>I</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>&#x3b1;</mml:mi>
<mml:mi>A</mml:mi>
<mml:mo>&#x25e6;</mml:mo>
<mml:mi>A</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mrow>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msup>
</mml:mrow>
<mml:mo stretchy="false">]</mml:mo>
</mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>m</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>0</mml:mn>
<mml:mo>,</mml:mo>
</mml:mtd>
</mml:mtr>
</mml:mtable>
</mml:math>
<label>(12)</label>
</disp-formula>where the unknowns include the weight matrix <italic>A</italic>, and parameters <italic>&#x3b8;</italic> for Variational Autoencoder (VAE). Further, ELBO is the Evidence Lower Bound of the VAE adopted from (<xref ref-type="bibr" rid="B48">Kingma and Welling, 2014</xref>) and <italic>h</italic>(<italic>A</italic>) is used to solve the augmented Lagrangian as done in (<xref ref-type="bibr" rid="B63">Nocedal and Wright, 2006</xref>).</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Architecture of DAG-GNN (<xref ref-type="bibr" rid="B107">Yu et&#x20;al., 2019</xref>). <italic>X</italic> is the observed data and <inline-formula id="inf6">
<mml:math id="m18">
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>X</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">&#x302;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula> its reconstruction, which is sampled from a factored Gaussian with mean <italic>M</italic>
<sub>
<italic>X</italic>
</sub> and standard deviation <italic>S</italic>
<sub>
<italic>X</italic>
</sub>.</p>
</caption>
<graphic xlink:href="fdata-04-642182-g005.tif"/>
</fig>
<p>So DAG-GNN is a more robust, nonlinear model which can learn more complex relationships than NOTEARS. Having an MLP as a backbone, it is capable of learning from a large training set and giving accurate results. Furthermore, autoencoders have been proven to be useful for unsupervised learning and feature extraction. This makes DAG-GNN capable of understanding causal relationships between atmospheric variables.</p>
</sec>
<sec id="s4-4">
<title>4.4 Static Versus Temporal Model</title>
<p>While TCDF requires time series data as input and explicitly models time delay of causal relations, NOTEARS and DAG-GNN assume that they are provided with i.i.d. observations of the variables. Similarly to other causal discovery studies in climate research (<xref ref-type="bibr" rid="B23">Ebert-Uphoff and Deng, 2012</xref>), we apply the latter two methods in two ways: in the <italic>static model</italic>, we treat the observations of the variables summarized in <xref ref-type="table" rid="T1">Table&#x20;1</xref> at different points in time as i.i.d. observations and directly feed the data into the two methods. Alternatively, in the <italic>temporal model</italic>, we first augment the data set by adding lagged versions of each variable, that is, for each variable <italic>X</italic> we additionally consider variables <italic>X</italic>
<sup>1</sup>, <italic>X</italic>
<sup>2</sup>, &#x2026; , <italic>X</italic>
<sup>12</sup>, where <italic>X</italic>
<sup>
<italic>k</italic>
</sup> is a version of the variable <italic>X</italic> that is measured with a lag of <italic>k</italic> time units (in our case: months) compared to <italic>X</italic>. Here, the maximum time lag we consider is 12&#xa0;months since we want to focus on causal links from sub-seasonal to seasonal timescales. We then treat the observations of the various variables at different points in time as i.i.d. observations and run NOTEARS and DAG-GNN, respectively. The graphs produced by these methods, using the augmented data, are assumed to encode the time delay of causal relations. However, in order to obtain a causal graph on the variables of <xref ref-type="table" rid="T1">Table&#x20;1</xref> we generate a &#x201c;reduced&#x201d; temporal graph from these &#x201c;full&#x201d; temporal graphs by connecting two variables <italic>X</italic> and <italic>Y</italic> in the reduced temporal graph whenever any of the variables <italic>X</italic>, <italic>X</italic>
<sup>1</sup>, &#x2026; , <italic>X</italic>
<sup>12</sup> is connected to any of <italic>Y</italic>, <italic>Y</italic>
<sup>1</sup>, &#x2026; , <italic>Y</italic>
<sup>12</sup> in the full temporal graph. The reduced temporal graph is the output of the temporal&#x20;model.</p>
</sec>
</sec>
<sec id="s5">
<title>5 Results</title>
<p>In this section we present some results of the three causal discovery algorithms introduced in <xref ref-type="sec" rid="s4">Section 4</xref>. We study how the causality graphs produced by the three methods depend on the choice of hyperparameters and see that the graphs can be quite different for varying hyperparameters. We work with the normalized Hamming distance (ignoring the edge weights in the graphs produced by NOTEARS or DAG-GNN) and also compare all graphs to the domain knowledge graph (<xref ref-type="fig" rid="F1">Figure&#x20;1</xref>). Note that we do not quantify the strength of causal relationships in the domain knowledge graph, and we evaluate the algorithms in terms of whether they are capable of detecting these causal relationships, but not in terms of estimating the strength of relationships.</p>
<p>In this section, we treat all graphs as unweighted graphs. The normalized Hamming distance is a widely used metric to compare two unweighted graphs on the same set of vertices (<xref ref-type="bibr" rid="B22">Donnat and Holmes, 2018</xref>). Let <italic>A</italic>, <italic>B</italic>&#x20;&#x2208;{0,1}<sup>
<italic>m</italic>&#xd7;<italic>m</italic>
</sup> be the adjacency matrices of two unweighted graphs <italic>G</italic>
<sub>
<italic>A</italic>
</sub>, <italic>G</italic>
<sub>
<italic>B</italic>
</sub> on <italic>m</italic> vertices. The normalized Hamming distance between <italic>G</italic>
<sub>
<italic>A</italic>
</sub> and <italic>G</italic>
<sub>
<italic>B</italic>
</sub> is given by <inline-formula id="inf7">
<mml:math id="m19">
<mml:mi>d</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>s</mml:mi>
<mml:msub>
<mml:mrow>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>H</mml:mi>
<mml:mi>D</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo stretchy="false">(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>G</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>A</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>G</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>B</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi>m</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mfrac>
<mml:msubsup>
<mml:mrow>
<mml:mo movablelimits="false" form="prefix">&#x2211;</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>j</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi>m</mml:mi>
</mml:mrow>
</mml:msubsup>
<mml:mn>1</mml:mn>
<mml:mrow>
<mml:mo stretchy="false">{</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mi>A</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2260;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi>B</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo stretchy="false">}</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>, that is, the number of edges that are present in one graph but not in the other, normalized by the number of all possible edges. The normalized Hamming distance between <italic>G</italic>
<sub>
<italic>A</italic>
</sub> and <italic>G</italic>
<sub>
<italic>B</italic>
</sub> is zero if and only if <italic>G</italic>
<sub>
<italic>A</italic>
</sub> and <italic>G</italic>
<sub>
<italic>B</italic>
</sub> coincide, and it is at most one (which happens if one graph is empty, i.e.,&#x20;does not have any edges, and the other graph is complete, i.e.,&#x20;any two vertices are connected). In the following, for each of the three causal discovery algorithms introduced in <xref ref-type="sec" rid="s4">Section 4</xref> we compute the normalized Hamming distance between the graphs produced by an algorithm for different values of its hyperparameters. We also compare the graphs to the domain knowledge graph shown in <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>, which is generated based on current literature.</p>
<sec id="s5-1">
<title>5.1 Causality Discovery Results Based on Temporal Causality Discovery Framework Approach</title>
<p>
<xref ref-type="table" rid="T2">Table&#x20;2</xref> shows the values for the normalized Hamming distance for the TCDF method, which quantifies the similarity of two causality graphs. A smaller number indicates that two causality graphs are more similar to each other. Two hyperparameters that were chosen are the kernel size, which is how many data points are combined together, and the number of hidden layers, which perform nonlinear transformations of the inputs entered into the network. The number of hidden layers corresponds to the number of hidden CNN layers in the TCDF algorithm. It seems that the addition of a hidden layer leads to far worse results and even produces no causality graphs, as is the case when <italic>kernel</italic> &#x3d; 4 and <italic>kernel</italic> &#x3d; 6 for <italic>layer</italic> &#x3d; 1. The kernel size is related to how much the TCDF method lags the variables for the causality study. The default setting for the hyperparameters, as shown with <italic>&#x2663;</italic> in <xref ref-type="table" rid="T2">Table&#x20;2</xref>, produces TCDF&#x2019;s best result when comparing to the domain knowledge graph, but that is nowhere close to the domain knowledge graph shown in <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>. It seems that the TCDF method does not produce good results for our Arctic Sea Ice&#x20;data.</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Distance matrix with respect to the normalized Hamming distance for TCDF. <italic>&#x2663;</italic> denotes that <italic>layer</italic> &#x3d;0, <italic>kernel</italic> &#x3d;4 are the algorithm&#x2019;s default hyperparameters. The bottom row compares to the domain knowledge graph of <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>, with the best values being marked in bold.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th rowspan="2" align="left"/>
<th rowspan="2" align="left"/>
<th colspan="6" align="center">
<italic>Temporal</italic>
</th>
</tr>
<tr>
<td align="center">
<italic>layer</italic> &#x3d; 0</td>
<td align="center">
<italic>layer</italic> &#x3d; 0</td>
<td align="center">
<italic>layer</italic> &#x3d; 0</td>
<td align="center">
<italic>layer</italic> &#x3d; 1</td>
<td align="center">
<italic>layer</italic> &#x3d; 1</td>
<td align="center">
<italic>layer</italic> &#x3d; 1</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="center">
<italic>kernel</italic> &#x3d; 2</td>
<td align="center">
<italic>kernel</italic> &#x3d; 4<sup>
<italic>&#x2663;</italic>
</sup>
</td>
<td align="center">
<italic>kernel</italic> &#x3d; 6</td>
<td align="center">
<italic>kernel</italic> &#x3d; 2</td>
<td align="center">
<italic>kernel</italic> &#x3d; 4</td>
<td align="center">
<italic>kernel</italic> &#x3d; 6</td>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">
<italic>Temporal</italic>
</td>
<td align="left">
<italic>layer</italic> &#x3d; 0, <italic>kernel</italic> &#x3d; 2</td>
<td align="center">0</td>
<td align="center">0.05</td>
<td align="center">0.01</td>
<td align="center">0.02</td>
<td align="center">0.01</td>
<td align="center">0.01</td>
</tr>
<tr>
<td align="left"/>
<td align="left">
<italic>layer</italic> &#x3d; 0, <italic>kernel</italic> &#x3d; 4<sup>
<italic>&#x2663;</italic>
</sup>
</td>
<td align="center">0.05</td>
<td align="center">0</td>
<td align="center">0.06</td>
<td align="center">0.07</td>
<td align="center">0.06</td>
<td align="center">0.06</td>
</tr>
<tr>
<td align="left"/>
<td align="left">
<italic>layer</italic> &#x3d; 0, <italic>kernel</italic> &#x3d; 6</td>
<td align="center">0.01</td>
<td align="center">0.06</td>
<td align="center">0</td>
<td align="center">0.01</td>
<td align="center">0.01</td>
<td align="center">0.01</td>
</tr>
<tr>
<td align="left"/>
<td align="left">
<italic>layer</italic> &#x3d; 1, <italic>kernel</italic> &#x3d; 2</td>
<td align="center">0.02</td>
<td align="center">0.07</td>
<td align="center">0.01</td>
<td align="center">0</td>
<td align="center">0.02</td>
<td align="center">0.02</td>
</tr>
<tr>
<td align="left"/>
<td align="left">
<italic>layer</italic> &#x3d; 1, <italic>kernel</italic> &#x3d; 4</td>
<td align="center">0.01</td>
<td align="center">0.06</td>
<td align="center">0.01</td>
<td align="center">0.02</td>
<td align="center">0</td>
<td align="center">0</td>
</tr>
<tr>
<td align="left"/>
<td align="left">
<italic>layer</italic> &#x3d; 1, <italic>kernel</italic> &#x3d; 6</td>
<td align="center">0.01</td>
<td align="center">0.06</td>
<td align="center">0.01</td>
<td align="center">0.02</td>
<td align="center">0</td>
<td align="center">0</td>
</tr>
<tr>
<td align="left"/>
<td align="left">Domain knowl.</td>
<td align="center">0.35</td>
<td align="center">
<bold>0.33</bold>
</td>
<td align="center">0.34</td>
<td align="center">0.34</td>
<td align="center">
<bold>0.33</bold>
</td>
<td align="center">
<bold>0.33</bold>
</td>
</tr>
</tbody>
</table>
</table-wrap>
<sec id="s5-1-1">
<title>5.1.1 Comparison Between Temporal Causality Discovery Framework Based Causality Graph and Domain Knowledge Graph</title>
<p>Since the TCDF focuses on time series, only the temporal graph that is closest to the domain knowledge graph is shown (<xref ref-type="fig" rid="F6">Figure&#x20;6</xref>). In general, if the causality graph generated by the algorithm looks similar to <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>, we believe that this approach is more capable of capturing the real causal relationships in the Arctic. There is no cause and effect between sea ice and any atmospheric variables. As for the causality within the atmosphere, only a few edges (cause-effect relationships) are generated by the TCDF algorithm. Among them, the feedback between u10&#xa0;m and v10&#xa0;m, as well as the impact of SW on CW are not consistent with domain knowledge.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>The TCDF graph that is closest to the domain knowledge graph of <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>. The temporal graph for <italic>layer</italic> &#x3d;0, <italic>kernel</italic> &#x3d;4.</p>
</caption>
<graphic xlink:href="fdata-04-642182-g006.tif"/>
</fig>
</sec>
</sec>
<sec id="s5-2">
<title>5.2 Causality Discovery Results Based on Non-combinatorial Optimization <italic>via</italic> Trace Exponential and Augmented Lagrangian for Structure Learning Approach</title>
<p>The NOTEARS algorithm has two hyperparameters <italic>&#x3bb;</italic> &#x2265; 0 and <italic>t</italic>&#x20;&#x2265; 0 as explained in <xref ref-type="sec" rid="s4-2">Section 4.2</xref>: the parameter <italic>&#x3bb;</italic> is the regularization parameter (cf. <xref ref-type="disp-formula" rid="e5">Eq. 5</xref>) and <italic>t</italic> is the threshold for setting edge weights of the preliminary output to zero (cf. end of <xref ref-type="sec" rid="s4-2">Section 4.2</xref>). There is no default value for <italic>&#x3bb;</italic>, but in the main experiment that comes with the NOTEARS code (<xref ref-type="bibr" rid="B111">Zheng et&#x20;al., 2018</xref>), the authors use <italic>&#x3bb;</italic> &#x3d; 0.1 and hence we consider that value to be the default value. Furthermore, we observed that choosing a value larger than 0.1 for <italic>&#x3bb;</italic> often results in an empty graph as the output of NOTEARS. The default value for <italic>t</italic> is <italic>t</italic>&#x20;&#x3d; 0.3. Indeed, we observed that <italic>t</italic>&#x20;&#x3d; 0.3 yields better results when comparing to the domain knowledge graph than other values of&#x20;<italic>t</italic>.</p>
<p>
<xref ref-type="table" rid="T3">Table&#x20;3</xref> shows the normalized Hamming distance between the graphs produced by NOTEARS for <italic>&#x3bb;</italic> &#x2208;{0, 0.1} and <italic>t</italic>&#x20;&#x2208;{0.2, 0.3}, for both the static and the temporal model. The last row of the table shows the normalized Hamming distance between the various graphs and the domain knowledge graph of <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>. Note that actually none of the graphs considered here is a DAG. We can see that the distances between the various temporal graphs (middle right part of the table) are significantly larger than the distances between the various static graphs (upper left part of the table). We can also see that changing the value of <italic>&#x3bb;</italic> from 0 to 0.1 causes a larger difference in the result than changing the value of <italic>t</italic> from 0.2 to 0.3 (e.g., the normalized Hamming distance between the static model with <italic>&#x3bb;</italic> &#x3d; 0, <italic>t</italic>&#x20;&#x3d; 0.2 and the static model with <italic>&#x3bb;</italic> &#x3d; 0, <italic>t</italic>&#x20;&#x3d; 0.3 is only 0.02, while the distance between the static model with <italic>&#x3bb;</italic> &#x3d; 0, <italic>t</italic>&#x20;&#x3d; 0.2 and the static model with <italic>&#x3bb;</italic> &#x3d; 0.1, <italic>t</italic>&#x20;&#x3d; 0.2 is&#x20;0.15).</p>
<table-wrap id="T3" position="float">
<label>TABLE 3</label>
<caption>
<p>Distance matrix with respect to the normalized Hamming distance for NOTEARS. <italic>&#x2663;</italic> denotes that <italic>&#x3bb;</italic> &#x3d;0.1, <italic>t</italic>&#x20;&#x3d;0.3 are the algorithm&#x2019;s default hyperparameters. The bottom row compares to the domain knowledge graph of <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>, with the best values being marked in bold.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th rowspan="2" align="left"/>
<th rowspan="2" align="left"/>
<th colspan="4" align="center">
<italic>Static</italic>
</th>
<th colspan="4" align="center">
<italic>Temporal</italic>
</th>
</tr>
<tr>
<td align="center">
<italic>&#x3bb;</italic> &#x3d; 0</td>
<td align="center">
<italic>&#x3bb;</italic> &#x3d; 0</td>
<td align="center">
<italic>&#x3bb;</italic> &#x3d; 0.1</td>
<td align="center">
<italic>&#x3bb;</italic> &#x3d; 0.1</td>
<td align="center">
<italic>&#x3bb;</italic> &#x3d; 0</td>
<td align="center">
<italic>&#x3bb;</italic> &#x3d; 0</td>
<td align="center">
<italic>&#x3bb;</italic> &#x3d; 0.1</td>
<td align="center">
<italic>&#x3bb;</italic> &#x3d; 0.1</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="center">
<italic>t</italic>&#x20;&#x3d; 0.2</td>
<td align="center">
<italic>t</italic>&#x20;&#x3d; 0.3</td>
<td align="center">
<italic>t</italic>&#x20;&#x3d; 0.2</td>
<td align="center">
<italic>t</italic>&#x20;&#x3d; 0.3<sup>
<italic>&#x2663;</italic>
</sup>
</td>
<td align="center">
<italic>t</italic>&#x20;&#x3d; 0.2</td>
<td align="center">
<italic>t</italic>&#x20;&#x3d; 0.3</td>
<td align="center">
<italic>t</italic>&#x20;&#x3d; 0.2</td>
<td align="center">
<italic>t</italic>&#x20;&#x3d; 0.3<sup>
<italic>&#x2663;</italic>
</sup>
</td>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">
<italic>Static</italic>
</td>
<td align="center">
<italic>&#x3bb;</italic> &#x3d; 0, <italic>t</italic>&#x20;&#x3d; 0.2</td>
<td align="center">0.0</td>
<td align="center">0.02</td>
<td align="center">0.15</td>
<td align="center">0.15</td>
<td align="center">0.54</td>
<td align="center">0.36</td>
<td align="center">0.16</td>
<td align="center">0.15</td>
</tr>
<tr>
<td align="left"/>
<td align="center">
<italic>&#x3bb;</italic> &#x3d; 0, <italic>t</italic>&#x20;&#x3d; 0.3</td>
<td align="center">0.02</td>
<td align="center">0.0</td>
<td align="center">0.15</td>
<td align="center">0.12</td>
<td align="center">0.53</td>
<td align="center">0.35</td>
<td align="center">0.14</td>
<td align="center">0.12</td>
</tr>
<tr>
<td align="left"/>
<td align="center">
<italic>&#x3bb;</italic> &#x3d; 0.1, <italic>t</italic>&#x20;&#x3d; 0.2</td>
<td align="center">0.15</td>
<td align="center">0.15</td>
<td align="center">0.0</td>
<td align="center">0.02</td>
<td align="center">0.51</td>
<td align="center">0.36</td>
<td align="center">0.09</td>
<td align="center">0.1</td>
</tr>
<tr>
<td align="left"/>
<td align="center">
<italic>&#x3bb;</italic> &#x3d; 0.1, <italic>t</italic>&#x20;&#x3d; 0.3<sup>
<italic>&#x2663;</italic>
</sup>
</td>
<td align="center">0.15</td>
<td align="center">0.12</td>
<td align="center">0.02</td>
<td align="center">0.0</td>
<td align="center">0.52</td>
<td align="center">0.35</td>
<td align="center">0.07</td>
<td align="center">0.08</td>
</tr>
<tr>
<td align="left">
<italic>Temporal</italic>
</td>
<td align="center">
<italic>&#x3bb;</italic> &#x3d; 0, <italic>t</italic>&#x20;&#x3d; 0.2</td>
<td align="center">0.54</td>
<td align="center">0.53</td>
<td align="center">0.51</td>
<td align="center">0.52</td>
<td align="center">0.0</td>
<td align="center">0.18</td>
<td align="center">0.48</td>
<td align="center">0.51</td>
</tr>
<tr>
<td align="left"/>
<td align="center">
<italic>&#x3bb;</italic> &#x3d; 0, <italic>t</italic>&#x20;&#x3d; 0.3</td>
<td align="center">0.36</td>
<td align="center">0.35</td>
<td align="center">0.36</td>
<td align="center">0.35</td>
<td align="center">0.18</td>
<td align="center">0.0</td>
<td align="center">0.33</td>
<td align="center">0.34</td>
</tr>
<tr>
<td align="left"/>
<td align="center">
<italic>&#x3bb;</italic> &#x3d; 0.1, <italic>t</italic>&#x20;&#x3d; 0.2</td>
<td align="center">0.16</td>
<td align="center">0.14</td>
<td align="center">0.09</td>
<td align="center">0.07</td>
<td align="center">0.48</td>
<td align="center">0.33</td>
<td align="center">0.0</td>
<td align="center">0.03</td>
</tr>
<tr>
<td align="left"/>
<td align="center">
<italic>&#x3bb;</italic> &#x3d; 0.1, <italic>t</italic>&#x20;&#x3d; 0.3<sup>
<italic>&#x2663;</italic>
</sup>
</td>
<td align="center">0.15</td>
<td align="center">0.12</td>
<td align="center">0.1</td>
<td align="center">0.08</td>
<td align="center">0.51</td>
<td align="center">0.34</td>
<td align="center">0.03</td>
<td align="center">0.0</td>
</tr>
<tr>
<td align="left"/>
<td align="center">Domain knowl.</td>
<td align="center">0.35</td>
<td align="center">
<bold>0.33</bold>
</td>
<td align="center">0.36</td>
<td align="center">0.35</td>
<td align="center">0.54</td>
<td align="center">0.46</td>
<td align="center">0.37</td>
<td align="center">
<bold>0.35</bold>
</td>
</tr>
</tbody>
</table>
</table-wrap>
<sec id="s5-2-1">
<title>5.2.1 Comparison Between Non-combinatorial Optimization <italic>via</italic> Trace Exponential and Augmented Lagrangian for Structure Learning Based Causality Graph and Domain Knowledge Graph</title>
<p>In <xref ref-type="fig" rid="F7">Figure&#x20;7</xref>, we show both the static and the temporal graphs that are closest to the domain knowledge graph of <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>. The larger weights in the causality graph indicate a stronger relationship between two variables. Generally, while none of the produced graphs is really close to the domain knowledge graph, the static graph looks more reasonable.</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption>
<p>The NOTEARS graphs that are closest to the domain knowledge graph of <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>, with respect to the normalized Hamming distance as shown in <xref ref-type="table" rid="T3">Table&#x20;3</xref>. <bold>(A)</bold>: The static graph for <italic>&#x3bb;</italic> &#x3d; 0, <italic>t</italic>&#x20;&#x3d; 0.3. Note that in <xref ref-type="table" rid="T3">Table&#x20;3</xref> this graph is treated as an unweighted graph. The edge weights are estimates of the coefficients <italic>W</italic>
<sub>
<italic>ji</italic>
</sub> in the data generating model (4). The larger weights indicate stronger connection between two variables. <bold>(B)</bold>: The temporal graph for <italic>&#x3bb;</italic> &#x3d; 0.1, <italic>t</italic>&#x20;&#x3d; 0.3.</p>
</caption>
<graphic xlink:href="fdata-04-642182-g007.tif"/>
</fig>
<p>In the static graph, the RH and precipitation seem to dominate the sea ice changes, with weights of 0.55 and 0.41, respectively. In the meantime, the sea ice exerts a large influence on SW (weight of 0.79) and CW (weight of 0.31). The causal relations between precipitation, SW and sea ice in the domain knowledge graph of <xref ref-type="fig" rid="F1">Figure&#x20;1</xref> are well captured by the NOTEARS algorithm. However, RH and CW are believed to be only indirectly connected with sea ice changes (i.e.,&#x20;in the domain knowledge graph there is no direct connection between RH or CW and sea ice), but in the static graph produced by the NOTEARS algorithm there are direct connections. The causality between each pair of atmospheric variables is generally reasonable based on the domain knowledge graph. The connections between CW and v10&#xa0;m, SW and v10&#xa0;m, and v10&#xa0;m and u10&#xa0;m are not quite consistent with the domain knowledge graph. However, those connections may be physically reasonable because winds are related to changing temperatures, humidity, clouds and radiation through advection in a broader area. Compared with the static graph, the temporal graph detects only very few edges. It shows that the sea ice, SW and GH have delayed impacts on themselves, demonstrating that both sea ice and atmosphere have a degree of seasonal to year-long climate predictability. Note that NOTEARS does not model time delay of causal relations, as mentioned in <xref ref-type="sec" rid="s4-4">Section 4.4</xref>, and the temporal graphs that we produced using this algorithm do not contain straightforward-to-interpret time lag information.</p>
</sec>
</sec>
<sec id="s5-3">
<title>5.3 Causality Discovery Results Based on Directed Acyclic Graph-Graph Neural Networks Approach</title>
<p>Like the NOTEARS algorithm, DAG-GNN has two hyperparameters: <italic>&#x3c4;</italic> &#x2265; 0 and <italic>t</italic>&#x20;&#x2265; 0, where <italic>&#x3c4;</italic> is similar to <italic>&#x3bb;</italic> used in NOTEARS. We noticed that the output is very sensitive to the hyperparameter <italic>&#x3c4;</italic>, and we show the outputs for only two values of <italic>&#x3c4;</italic>, i.e.,&#x20;<italic>&#x3c4;</italic> &#x2208;{0, <italic>e</italic>&#x20;&#x2212; 7}. We vary <italic>t</italic> similarly to NOTEARS, and test for <italic>t</italic>&#x20;&#x2208;{0.2, 0.3}. <xref ref-type="table" rid="T4">Table&#x20;4</xref> tabulates the normalized Hamming distance computed between all the graphs obtained by varying these two hyperparameters. Further, we computed the normalized Hamming distance between all these graphs and the domain knowledge graph of <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>. In order to carry out this specific computation, we created unweighted matrices from the weighted outputs of DAG-GNN with the help of absolute thresholding using the hyperparameter&#x20;<italic>t</italic>.</p>
<table-wrap id="T4" position="float">
<label>TABLE 4</label>
<caption>
<p>Distance matrix with respect to the normalized Hamming distance for DAG-GNN. <italic>&#x2663;</italic> denotes the algorithm&#x2019;s default hyperparameters. The bottom row compares to the domain knowledge graph of <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>, with the best values being marked in bold.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left"/>
<th align="left"/>
<th colspan="4" align="center">
<italic>Static</italic>
</th>
<th colspan="4" align="center">
<italic>Temporal</italic>
</th>
</tr>
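<tr>
<td colspan="2" align="left"/>
<td align="center">
<italic>&#x3c4;</italic> &#x3d; 0</td>
<td align="center">
<italic>&#x3c4;</italic> &#x3d; 0</td>
<td align="center">
<italic>&#x3c4;</italic> &#x3d; <italic>e</italic>&#x20;&#x2212; 7</td>
<td align="center">
<italic>&#x3c4;</italic> &#x3d; <italic>e</italic>&#x20;&#x2212; 7</td>
<td align="center">
<italic>&#x3c4;</italic> &#x3d; 0</td>
<td align="center">
<italic>&#x3c4;</italic> &#x3d; 0</td>
<td align="center">
<italic>&#x3c4;</italic> &#x3d; <italic>e</italic>&#x20;&#x2212; 7</td>
<td align="center">
<italic>&#x3c4;</italic> &#x3d; <italic>e</italic>&#x20;&#x2212; 7</td>
</tr>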
<tr>
<td colspan="2" align="left"/>
<td align="center">
<italic>t</italic>&#x20;&#x3d; 0.2</td>
<td align="center">
<italic>t</italic>&#x20;&#x3d; 0.3<sup>
<italic>&#x2663;</italic>
</sup>
</td>
<td align="center">
<italic>t</italic>&#x20;&#x3d; 0.2</td>
<td align="center">
<italic>t</italic>&#x20;&#x3d; 0.3</td>
<td align="center">
<italic>t</italic>&#x20;&#x3d; 0.2</td>
<td align="center">
<italic>t</italic>&#x20;&#x3d; 0.3<sup>
<italic>&#x2663;</italic>
</sup>
</td>
<td align="center">
<italic>t</italic>&#x20;&#x3d; 0.2</td>
<td align="center">
<italic>t</italic>&#x20;&#x3d; 0.3</td>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">
<italic>Static</italic>
</td>
<td align="center">
<italic>&#x3c4;</italic> &#x3d; 0, <italic>t</italic>&#x20;&#x3d; 0.2</td>
<td align="center">0.0</td>
<td align="center">0.06</td>
<td align="center">0.04</td>
<td align="center">0.07</td>
<td align="center">0.1</td>
<td align="center">0.12</td>
<td align="center">0.1</td>
<td align="center">0.12</td>
</tr>
<tr>
<td align="left"/>
<td align="center">
<italic>&#x3c4;</italic> &#x3d; 0, <italic>t</italic>&#x20;&#x3d; 0.3<sup>
<italic>&#x2663;</italic>
</sup>
</td>
<td align="center">0.06</td>
<td align="center">0.0</td>
<td align="center">0.05</td>
<td align="center">0.01</td>
<td align="center">0.08</td>
<td align="center">0.07</td>
<td align="center">0.08</td>
<td align="center">0.07</td>
</tr>
<tr>
<td align="left"/>
<td align="center">
<italic>&#x3c4;</italic> &#x3d; <italic>e</italic>&#x20;&#x2212; 7, <italic>t</italic>&#x20;&#x3d; 0.2</td>
<td align="center">0.04</td>
<td align="center">0.05</td>
<td align="center">0.0</td>
<td align="center">0.06</td>
<td align="center">0.08</td>
<td align="center">0.1</td>
<td align="center">0.08</td>
<td align="center">0.1</td>
</tr>
<tr>
<td align="left"/>
<td align="center">
<italic>&#x3c4;</italic> &#x3d; <italic>e</italic>&#x20;&#x2212; 7, <italic>t</italic>&#x20;&#x3d; 0.3</td>
<td align="center">0.07</td>
<td align="center">0.01</td>
<td align="center">0.06</td>
<td align="center">0.0</td>
<td align="center">0.08</td>
<td align="center">0.08</td>
<td align="center">0.08</td>
<td align="center">0.08</td>
</tr>
<tr>
<td align="left">
<italic>Temporal</italic>
</td>
<td align="center">
<italic>&#x3c4;</italic> &#x3d; 0, <italic>t</italic>&#x20;&#x3d; 0.2</td>
<td align="center">0.1</td>
<td align="center">0.08</td>
<td align="center">0.08</td>
<td align="center">0.08</td>
<td align="center">0.0</td>
<td align="center">0.03</td>
<td align="center">0.01</td>
<td align="center">0.03</td>
</tr>
<tr>
<td align="left"/>
<td align="center">
<italic>&#x3c4;</italic> &#x3d; 0, <italic>t</italic>&#x20;&#x3d; 0.3<sup>
<italic>&#x2663;</italic>
</sup>
</td>
<td align="center">0.12</td>
<td align="center">0.07</td>
<td align="center">0.1</td>
<td align="center">0.08</td>
<td align="center">0.03</td>
<td align="center">0.0</td>
<td align="center">0.05</td>
<td align="center">0.0</td>
</tr>
<tr>
<td align="left"/>
<td align="center">
<italic>&#x3c4;</italic> &#x3d; <italic>e</italic>&#x20;&#x2212; 7, <italic>t</italic>&#x20;&#x3d; 0.2</td>
<td align="center">0.1</td>
<td align="center">0.08</td>
<td align="center">0.08</td>
<td align="center">0.08</td>
<td align="center">0.01</td>
<td align="center">0.05</td>
<td align="center">0.0</td>
<td align="center">0.05</td>
</tr>
<tr>
<td align="left"/>
<td align="center">
<italic>&#x3c4;</italic> &#x3d; <italic>e</italic>&#x20;&#x2212; 7, <italic>t</italic>&#x20;&#x3d; 0.3</td>
<td align="center">0.12</td>
<td align="center">0.07</td>
<td align="center">0.1</td>
<td align="center">0.08</td>
<td align="center">0.03</td>
<td align="center">0.0</td>
<td align="center">0.05</td>
<td align="center">0.0</td>
</tr>
<tr>
<td align="left"/>
<td align="center">Domain knowl</td>
<td align="center">0.33</td>
<td align="center">0.33</td>
<td align="center">0.35</td>
<td align="center">
<bold>0.32</bold>
</td>
<td align="center">0.35</td>
<td align="center">
<bold>0.34</bold>
</td>
<td align="center">0.36</td>
<td align="center">
<bold>0.34</bold>
</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>From <xref ref-type="table" rid="T4">Table&#x20;4</xref>, we see that the smallest normalized Hamming Distance with the Domain Knowledge Graph is obtained by <italic>&#x3c4;</italic> &#x3d; <italic>e</italic>&#x20;&#x2212; 7, <italic>t</italic>&#x20;&#x3d; 0.3 for the static model and <italic>&#x3c4;</italic> &#x2208;{0, <italic>e</italic>&#x20;&#x2212; 7}, <italic>t</italic>&#x20;&#x3d; 0.3 for the temporal model. Both temporal models with <italic>t</italic>&#x20;&#x3d; 0.3 give the same graph, which is shown in <xref ref-type="fig" rid="F8">Figure&#x20;8</xref> on the right. For the static model, however, these optimal values of <italic>&#x3c4;</italic> and <italic>t</italic> produce a graph which shows no relation between sea ice and other atmospheric variables. Hence, we reject it. The next-best graph that shows a dependence of sea ice on atmospheric variables is shown in <xref ref-type="fig" rid="F8">Figure&#x20;8</xref> on the left. Its hyperparameters are <italic>&#x3c4;</italic> &#x3d; 0 and <italic>t</italic>&#x20;&#x3d; 0.2. Further, we note that for the temporal model, the best graphs are obtained with <italic>t</italic>&#x20;&#x3d; 0.3, which is one of the default parameters used and suggested by the authors (<xref ref-type="bibr" rid="B107">Yu et&#x20;al., 2019</xref>).</p>
<fig id="F8" position="float">
<label>FIGURE 8</label>
<caption>
<p>The DAG-GNN graphs that are closest to the domain knowledge graph of <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>. <bold>(A)</bold>: The static graph for <italic>&#x3c4;</italic> &#x3d; 0, <italic>t</italic>&#x20;&#x3d; 0.2. The larger weights indicate stronger connection between two variables. <bold>(B)</bold>: The temporal graph for <italic>&#x3c4;</italic> &#x2208;{0, <italic>e</italic>&#x20;&#x2212; 7}, <italic>t</italic>&#x20;&#x3d; 0.3.</p>
</caption>
<graphic xlink:href="fdata-04-642182-g008.tif"/>
</fig>
<sec id="s5-3-1">
<title>5.3.1 Comparison Between Directed Acyclic Graph-Graph Neural Networks Based Causality Graph and Domain Knowledge Graph</title>
<p>The static and the temporal graphs closest to the domain knowledge graph are shown in <xref ref-type="fig" rid="F8">Figure&#x20;8</xref>. Compared to NOTEARS, both static and temporal graphs produced by DAG-GNN are more complicated. The dynamical fields (u10&#xa0;m and v10&#xa0;m) dominate the sea ice changes, but with relatively small weights 0.21 and &#x2212;0.25, respectively. Here, the positive (negative) edge weights indicate a positive (negative) causal effect. In this case, the negative weights between v10&#xa0;m and sea ice suggest that increasing v10&#xa0;m tends to decrease sea ice. Stronger northward winds can enhance ice melt by increasing ice drifting (<xref ref-type="bibr" rid="B89">Spreen et&#x20;al., 2011</xref>) and bringing more heat and moisture from lower latitudes (<xref ref-type="bibr" rid="B110">Zhang et&#x20;al., 2013</xref>). In the meantime, positive zonal winds (u10&#xa0;m) generally isolate the Arctic from mid-latitudes, leading to cooling (in winter) and thus more sea ice (<xref ref-type="bibr" rid="B65">Overland and Wang, 2010</xref>). As for the causal relations between multiple atmospheric processes, they are generally reasonable compared to <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>. Similar to NOTEARS, the connections between u10&#xa0;m and v10&#xa0;m (0.95), SW and v10&#xa0;m (0.25), CW and v10&#xa0;m (0.32) are neither reasonable nor consistent with the domain knowledge graph. As mentioned earlier, this is most likely because we averaged these variables in the Arctic region and those variables may exhibit relatively high correlations over a large domain. Note that the increased CW and CC tend to reflect solar radiation back to the space, leaving less SW reaching the surface. These negative relationships between CC, CW, and SW are captured by DAG-GNN; however, the directions of the arrows are not meaningful. The same issue occurs in the temporal graph. In addition, sea ice has a delayed impact on itself, but no connection with any atmospheric processes in the temporal graph. As in the static graph, the causality between u10&#xa0;m and v10&#xa0;m as well as CW and v10&#xa0;m is not consistent with the domain knowledge graph. Similar to NOTEARS, DAG-GNN does not model the time delay of causal relations either.</p>
</sec>
</sec>
<sec id="s5-4">
<title>5.4 Sensitivity Tests</title>
<p>We conducted additional tests with slightly different datasets to show how the causality discovery approaches are sensitive to the data. Because the results above are based on the detrended and deseasonalized data sets, the first sensitivity test we did is with raw data. Here, we show the similar static graphs as <xref ref-type="fig" rid="F7">Figures 7</xref>, <xref ref-type="fig" rid="F8">8</xref>, but with raw data in <xref ref-type="fig" rid="F9">Figure&#x20;9</xref>. The TCDF still does not generate meaningful edges between atmospheric components and sea ice (not shown). The NOTEARS produces different results between raw data and detrended data. Using raw data, CC, GH, LW and SW dominate sea ice changes. In comparison, RH and precipitation have a large influence on sea ice variations based on detrended and deseasonalized data. The DAG-GNN also generates more complicated results with raw data. In particular, CW, GH, SLP, LW, and SW are found to dominate sea ice variations, which show similar results as NOTEARS. Note that both NOTEARS and DAG-GNN cannot capture the response in atmosphere to sea ice variations using raw data. As mentioned earlier, the relationships obtained from detrended and deseasonalized data represent natural variability, while raw data provides information about actual changes.</p>
<fig id="F9" position="float">
<label>FIGURE 9</label>
<caption>
<p>The graphs produced with raw data sets (non-detrended and non-deseasonalized). <bold>(A)</bold>: The NOTEARS static graph for <italic>&#x3bb;</italic> &#x3d; 0, <italic>t</italic>&#x20;&#x3d; 0.3. <bold>(B)</bold>: The DAG-GNN static graph for <italic>&#x3c4;</italic> &#x3d; 0, <italic>t</italic>&#x20;&#x3d; 0.2.</p>
</caption>
<graphic xlink:href="fdata-04-642182-g009.tif"/>
</fig>
<p>The second sensitivity test we carried out is with dataset that also includes air temperature (averaged from 1,000&#x2013;300&#xa0;hPa). In <xref ref-type="fig" rid="F10">Figure&#x20;10</xref>, we show the similar static graphs as <xref ref-type="fig" rid="F7">Figures 7</xref>, <xref ref-type="fig" rid="F8">8</xref>, but include variable &#x201c;Temp&#x201d;. In general, the TCDF does not generate any meaningful results (not shown). The NOTEARS shows that temperatures have a large impact on the LW and HFLX, which is physically meaningful based on Stefan-Boltzmann law. In this case, RH dominates the changes in sea ice, while sea ice exerts large influence on SW. These results are similar to <xref ref-type="fig" rid="F7">Figure&#x20;7</xref>, in which we excluded temperature. According to results produced by DAG-GNN, temperatures have an impact on SLP, HFLX, CC, RH, LW, and v10&#xa0;m. These connections are relatively reasonable since we average those variables in a large domain. However, there is no edge between sea ice and atmospheric components anymore. We believe that the connections between sea ice and atmosphere could have been filtered out, because the edges among atmospheric components have much larger weights.</p>
<fig id="F10" position="float">
<label>FIGURE 10</label>
<caption>
<p>The graphs produced with data sets including air temperature averaged from 1,000 to 300&#xa0;hPa. <bold>(A)</bold>: The NOTEARS static graph for <italic>&#x3bb;</italic> &#x3d; 0, <italic>t</italic>&#x20;&#x3d; 0.3. <bold>(B)</bold>: The DAG-GNN static graph for <italic>&#x3c4;</italic> &#x3d; 0, <italic>t</italic>&#x20;&#x3d; 0.2.</p>
</caption>
<graphic xlink:href="fdata-04-642182-g010.tif"/>
</fig>
</sec>
</sec>
<sec id="s6">
<title>6 Conclusion and Discussion</title>
<p>The Arctic has undergone dramatic changes in the past few decades, and sea ice decline is believed to be a key driver for the Arctic amplification. On the one hand, the sea ice is melted by mixed effects of atmospheric dynamical and thermodynamical processes. These processes on the other hand, can be largely affected by sea ice melt. Therefore, this study investigates the causality between multiple atmospheric processes and sea ice variations using three data-driven causality discovery approaches (TCDF, NOTEARS and DAG-GNN). As shown in previous sections, one advantage of utilizing these approaches is that they not only generate causal graphs, but also provide quantified information on causal strength through weights or time lags. Another advantage is that these approaches can take all relevant variables into consideration and find potentially important causal relationships, which is different from most related studies which only analyze pair-wise causality between two variables. Instead of performing computationally expensive climate model simulations, here we focus solely on an observational-based analysis. Specifically, we examine the sensitivity of causality graphs produced by three methods to different hyperparameters and then compare those graphs with domain knowledge&#x20;graph.</p>
<p>We found that the outputs of the three algorithms are rather sensitive to the choice of hyperparameters. For example, choosing an only slightly too large regularization parameter can result in NOTEARS or DAG-GNN producing empty graphs, that is, not discovering any causal relationships at all. Also, the values of the other parameters turned out to be important and outputs for different choices of the hyperparameters can be quite different. Hence, some care must be taken when applying data-driven causality discovery approaches and domain knowledge is indispensable for assessing whether their produced outputs are reasonable.</p>
<p>Compared to domain knowledge graph, the static graphs produced by NOTEARS and DAG-GNN are relatively reasonable. The results from NOTEARS suggest that RH and precipitation dominate sea ice changes among all variables. In the meantime, the sea ice has a large impact on SW and CW. The graph generated by DAG-GNN, however, indicates that the zonal (u10&#xa0;m) and meridional (v10&#xa0;m) wind fields are more important for driving sea ice variations than other variables. And there are no atmospheric variables being affected by the sea ice. Note that the edges between u10&#xa0;m and v10&#xa0;m, SW and v10&#xa0;m, CW and v10&#xa0;m are produced by both NOTEARS and DAG-GNN, which are different from domain knowledge graph, possibly due to the averages over a large domain. As for the temporal graphs, very few edges can be found in TCDF and NOTEARS. In comparison, the DAG-GNN is able to produce more complicated and meaningful results. The sea ice is found to have a delayed impact on itself, but with no causal relationship with any atmospheric processes. This is possibly because sea ice anomaly persistence is much stronger than the connections between sea ice and atmosphere. It is our hope that those causality graphs can be compared with the ones produced by other algorithms as Artificial Intelligence technologies are evolving rapidly. In the meantime, they can be also compared with the causal links captured by physical models for cross-validation.</p>
<p>Based on our analysis, it is still very challenging to directly apply these state-of-the-art data-driven causality discovery approaches to this specific climate topic. However, there are several limitations of the current study, which potentially have a large influence on our results. 1) There are large uncertainties in the domain knowledge graph and thus it cannot be considered as ground truth. Climate scientists strive to investigate the complex feedbacks between atmosphere and sea ice, but our knowledge in this field is still very limited and controversial. For example, a few recent studies have divergent consensuses on Arctic amplification&#x2019;s influence on mid-latitude severe winter weather (<xref ref-type="bibr" rid="B4">Blackport et&#x20;al., 2019</xref>; <xref ref-type="bibr" rid="B18">Cohen et&#x20;al., 2019</xref>). 2) We average the atmospheric and sea ice variables within the pan-Arctic domain (north of 60&#xb0;N) and our analysis is only based on the time-series. However, the causal relationships between atmosphere and sea ice could be regionally dependent. 3) We use the full monthly atmosphere and sea ice records during 1980&#x2013;2018. The feedbacks between atmosphere and sea ice are highly variable with season, and physical mechanisms work differently with and without sunlight. For example, previous studies pointed out the cloud response to sea ice melt occurs in all seasons except in summer (<xref ref-type="bibr" rid="B46">Kay and Gettelman, 2009</xref>; <xref ref-type="bibr" rid="B95">Taylor et&#x20;al., 2015</xref>; <xref ref-type="bibr" rid="B61">Morrison et&#x20;al., 2018</xref>; <xref ref-type="bibr" rid="B36">Huang et&#x20;al., 2019a</xref>). Moreover, the interactions between atmosphere and sea ice may occur at shorter time scales (e.g., daily). 4) The weights among different atmospheric variables are much higher than those between atmosphere and sea ice. Thus, the edges in the latter category could have been filtered out. 
5) We only consider the interactions between atmosphere and sea ice in this study. The oceanic processes (e.g., ocean currents, ocean salinity) might also exert large influence on sea ice variations in the Arctic. For example, when salt is ejected into the ocean as sea ice forms, the water&#x2019;s salinity increases. Therefore, a gradual freshening of the upper Arctic ocean will continue with Arctic sea ice decline (<xref ref-type="bibr" rid="B52">Li and Fedorov, 2021</xref>). Our study is a starting point to investigate the atmosphere-sea ice feedback using data-driven causality approaches, and it can be extended to the interactions between atmosphere, ocean, sea ice and even other components (e.g., land ice) in the future. 6) Only one global reanalysis product is used in this study and the results could be more robust if we expand our analysis with different products. It should be noted that the majority of connections considered in this study have been validated by different observational, reanalysis and/or climate models (<xref ref-type="bibr" rid="B21">Ding et&#x20;al., 2017</xref>; <xref ref-type="bibr" rid="B2">Baxter et&#x20;al., 2019</xref>). Thus, we believe that our results may not highly depend on the choice of data sets. Moreover, all results shown in this study are based on detrended and deseasonalized data. We also performed additional experiments with raw data. Based on NOTEARS and DAG-GNN, geopotential heights, clouds, surface longwave, and shortwave flux are found to dominate sea ice changes, which are different from the results shown in <xref ref-type="fig" rid="F7">Figures 7</xref>,&#x20;<xref ref-type="fig" rid="F8">8</xref>.</p>
<p>Nevertheless, this is a pioneering study in the application of data-driven causality discovery approaches to the interactions between atmosphere and sea ice. This study will pave the way for us to disentangle the complicated causal relationships in the Earth system, by taking advantage of cutting-edge data science and Artificial Intelligence technologies. It also provides a good opportunity for climate scientists, data scientists and computer scientists to work together to solve the puzzles of nature, which will eventually advance our understanding of the polar climate system and global climate change.</p>
</sec>
</body>
<back>
<sec id="s7">
<title>Data Availability Statement</title>
<p>The sea ice concentration and extent were obtained from the National Snow and Ice Data Center: <ext-link ext-link-type="uri" xlink:href="http://nsidc.org/data/NSIDC-0051">http://nsidc.org/data/NSIDC-0051</ext-link>. The ECMWF ERA-5 global reanalysis product can be found via <ext-link ext-link-type="uri" xlink:href="https://cds.climate.copernicus.eu/cdsapp#!/home">https://cds.climate.copernicus.eu/cdsapp&#x23;&#x21;/home</ext-link>. The codes and input for three models are available on GitHub: <ext-link ext-link-type="uri" xlink:href="https://github.com/big-data-lab-umbc/cybertraining/tree/master/year-3-projects/team-6">https://github.com/big-data-lab-umbc/cybertraining/tree/master/year-3-projects/team-6</ext-link>.</p>
</sec>
<sec id="s8">
<title>Author Contributions</title>
<p>YH downloaded data sets, carried out data pre-processing, prepared the domain knowledge graph and wrote the paper; MK, AM, and DV implemented the causal discovery methods, generated their graphs and wrote the paper; PG carried out data pre-processing, worked on attention based causality discovery and dealt with technical issues related to high performance computing; JW provided direction to the project and crucial guidance for this work; All authors participated in regular constructive discussions and contributed to interpreting the results and writing the paper.</p>
</sec>
<sec id="s9">
<title>Funding</title>
<p>This work is supported by the grant &#x201c;CyberTraining: DSE: Cross-Training of Researchers in Computing, Applied Mathematics and Atmospheric Sciences using Advanced Cyberinfrastructure Resources&#x201d; (OAC&#x2013;1730250) and grant &#x201c;CAREER: Big Data Climate Causality Analytics&#x201d; (OAC&#x2013;1942714) from the National Science Foundation.</p>
</sec>
<sec sec-type="COI-statement" id="s10">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s11" sec-type="disclaimer">
<title>Publisher&#x2019;s Note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ack>
<p>The hardware used in the computational studies is part of the UMBC High Performance Computing Facility (HPCF). The facility is supported by the United&#x20;States National Science Foundation through the MRI program (Grant Nos. CNS&#x2013;0821258, CNS&#x2013;1228778, and OAC&#x2013;1726023) and the SCREMS program (Grant No. DMS&#x2013;0821311), with additional substantial support from the University of Maryland, Baltimore County (UMBC). See <ext-link ext-link-type="uri" xlink:href="http://hpcf.umbc.edu">hpcf.umbc.edu</ext-link> for more information on HPCF and the projects using its resources. This manuscript has been released as a report at the UMBC High Performance Computing Facility (HPCF) web site (<xref ref-type="bibr" rid="B39">Huang et&#x20;al., 2020</xref>).</p>
</ack>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Aragam</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Amini</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>Q.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Learning Directed Acyclic Graphs with Penalized Neighbourhood Regression</article-title>. <source>ArXiv preprint</source>. <comment>ArXiv:1511.08963</comment>.</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Baxter</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Ding</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Schweiger</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>L&#x2019;Heureux</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Baxter</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>T.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>How Tropical Pacific Surface Cooling Contributed to Accelerated Sea Ice Melt from 2007 to 2012 as Ice Is Thinned by Anthropogenic Forcing</article-title>. <source>J.&#x20;Clim.</source> <volume>32</volume>, <fpage>8583</fpage>&#x2013;<lpage>8602</lpage>. <pub-id pub-id-type="doi">10.1175/jcli-d-18-0783.1</pub-id> </citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bintanja</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Selten</surname>
<given-names>F. M.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Future Increases in Arctic Precipitation Linked to Local Evaporation and Sea-Ice Retreat</article-title>. <source>Nature</source> <volume>509</volume>, <fpage>479</fpage>&#x2013;<lpage>482</lpage>. <pub-id pub-id-type="doi">10.1038/nature13259</pub-id> </citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Blackport</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Screen</surname>
<given-names>J.&#x20;A.</given-names>
</name>
<name>
<surname>van der Wiel</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Bintanja</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Minimal Influence of Reduced Arctic Sea Ice on Coincident Cold winters in Mid-latitudes</article-title>. <source>Nat. Clim. Chang.</source> <volume>9</volume>, <fpage>697</fpage>&#x2013;<lpage>704</lpage>. <pub-id pub-id-type="doi">10.1038/s41558-019-0551-4</pub-id> </citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Boisvert</surname>
<given-names>L. N.</given-names>
</name>
<name>
<surname>Stroeve</surname>
<given-names>J.&#x20;C.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>The Arctic Is Becoming Warmer and Wetter as Revealed by the Atmospheric Infrared Sounder</article-title>. <source>Geophys. Res. Lett.</source> <volume>42</volume>, <fpage>4439</fpage>&#x2013;<lpage>4446</lpage>. <pub-id pub-id-type="doi">10.1002/2015gl063775</pub-id> </citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Boisvert</surname>
<given-names>L. N.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Shie</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Increasing Evaporation Amounts Seen in the Arctic between 2003 and 2013 from AIRS Data</article-title>. <source>J.&#x20;Geophys. Res. Atmospheres</source> <volume>120</volume>, <fpage>6865</fpage>&#x2013;<lpage>6881</lpage>. <pub-id pub-id-type="doi">10.1002/2015jd023258</pub-id> </citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Boisvert</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Webster</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Petty</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Markus</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Bromwich</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Cullather</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Intercomparison of Precipitation Estimates over the Arctic Ocean and its Peripheral Seas from Reanalyses</article-title>. <source>J.&#x20;Clim.</source> <volume>31</volume>, <fpage>8441</fpage>&#x2013;<lpage>8462</lpage>. <pub-id pub-id-type="doi">10.1175/jcli-d-18-0125.1</pub-id> </citation>
</ref>
<ref id="B8">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Brockwell</surname>
<given-names>P. J.</given-names>
</name>
<name>
<surname>Davis</surname>
<given-names>R. A.</given-names>
</name>
</person-group> (<year>2016</year>). <source>Introduction to Time Series and Forecasting</source>. <publisher-name>Springer</publisher-name>.</citation>
</ref>
<ref id="B10">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Cavalieri</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Crawford</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Drinkwater</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Emery</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Eppler</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Farmer</surname>
<given-names>L.</given-names>
</name>
<etal/>
</person-group> (<year>1992</year>). &#x201c;<article-title>NASA Sea Ice Validation Program for the DMSP SSM/I: Final Report, NASA Technical Memorandum 104559</article-title>,&#x201d; in <source>Tech. Rep</source> (<publisher-loc>Washington, D.C.</publisher-loc>: <publisher-name>National Aeronautics and Space Administration</publisher-name>). </citation>
</ref>
<ref id="B11">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Cavalieri</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Parkinson</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Gloersen</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Zwally</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>1996</year>). <source>Sea Ice Concentrations from Nimbus-7 SMMR and DMSP SSM/I-SSMIS Passive Microwave Data, Version 1</source> (<publisher-loc>Boulder, CO, United States</publisher-loc>: <publisher-name>NASA National Snow and Ice Data Center Distributed Active Archive Center</publisher-name>). <pub-id pub-id-type="doi">10.5067/8GQ8LZQVL0VL</pub-id> </citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chemke</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Polvani</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Deser</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>The Effect of Arctic Sea Ice Loss on the Hadley Circulation</article-title>. <source>Geophys. Res. Lett.</source> <volume>46</volume>, <fpage>963</fpage>&#x2013;<lpage>972</lpage>. <pub-id pub-id-type="doi">10.1029/2018gl081110</pub-id> </citation>
</ref>
<ref id="B13">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Chickering</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>1996</year>). <article-title>Learning Bayesian Networks Is NP-Complete</article-title>. In <source>Learning from Data</source> (<publisher-name>Springer</publisher-name>), <volume>Vol. 112</volume> of <comment>Lecture Notes in Statistics</comment>
<pub-id pub-id-type="doi">10.1007/978-1-4612-2404-4_12</pub-id> </citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Choi</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Hur</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Ho</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Connecting Early Summer Cloud-Controlled Sunlight and Late Summer Sea Ice in the Arctic</article-title>. <source>J.&#x20;Geophys. Res. Atmospheres</source> <volume>119</volume>, <fpage>11,087</fpage>&#x2013;<lpage>11,099</lpage>. <pub-id pub-id-type="doi">10.1002/2014jd022013</pub-id> </citation>
</ref>
<ref id="B15">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Chu</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Danks</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Glymour</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2005</year>). &#x201c;<article-title>Data Driven Methods for Nonlinear Granger Causality: Climate Teleconnection Mechanisms</article-title>,&#x201d; in <source>Tech. Rep. CMU-PHIL-171</source> (<publisher-name>Department of Philosophy, Carnegie Mellon University</publisher-name>). </citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chu</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Glymour</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Search for Additive Nonlinear Time Series Causal Models</article-title>. <source>J.&#x20;Machine Learn. Res.</source> <volume>9</volume>, <fpage>967</fpage>&#x2013;<lpage>991</lpage>. <pub-id pub-id-type="doi">10.5555/1390681.1390713</pub-id> </citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cohen</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Screen</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Furtado</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Barlow</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Whittleston</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Coumou</surname>
<given-names>D.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>Recent Arctic Amplification and Extreme Mid-latitude Weather</article-title>. <source>Nat. Geosci.</source> <volume>7</volume>, <fpage>627</fpage>&#x2013;<lpage>637</lpage>. <pub-id pub-id-type="doi">10.1038/ngeo2234</pub-id> </citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cohen</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Francis</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Jung</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Kwok</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Overland</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Divergent Consensuses on Arctic Amplification Influence on Midlatitude Severe Winter Weather</article-title>. <source>Nat. Clim. Change</source> <volume>10</volume>, <fpage>20</fpage>&#x2013;<lpage>29</lpage>. <pub-id pub-id-type="doi">10.1038/s41558-019-0662-y</pub-id> </citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cox</surname>
<given-names>C. J.</given-names>
</name>
<name>
<surname>Uttal</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Long</surname>
<given-names>C. N.</given-names>
</name>
<name>
<surname>Shupe</surname>
<given-names>M. D.</given-names>
</name>
<name>
<surname>Stone</surname>
<given-names>R. S.</given-names>
</name>
<name>
<surname>Starkweather</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>The Role of Springtime Arctic Clouds in Determining Autumn Sea Ice Extent</article-title>. <source>J.&#x20;Clim.</source> <volume>29</volume>, <fpage>6581</fpage>&#x2013;<lpage>6596</lpage>. <pub-id pub-id-type="doi">10.1175/jcli-d-16-0136.1</pub-id> </citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cruz-Garc&#xed;a</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Guemas</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Chevallier</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Massonnet</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>An Assessment of Regional Sea Ice Predictability in the Arctic Ocean</article-title>. <source>Clim. Dyn.</source> <volume>53</volume>, <fpage>427</fpage>&#x2013;<lpage>440</lpage>. <pub-id pub-id-type="doi">10.1007/s00382-018-4592-6</pub-id> </citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ding</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Schweiger</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>L&#x2019;Heureux</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Battisti</surname>
<given-names>D. S.</given-names>
</name>
<name>
<surname>Po-Chedley</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Johnson</surname>
<given-names>N. C.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Influence of High-Latitude Atmospheric Circulation Changes on Summertime Arctic Sea Ice</article-title>. <source>Nat. Clim. Change</source> <volume>7</volume>, <fpage>289</fpage>&#x2013;<lpage>295</lpage>. <pub-id pub-id-type="doi">10.1038/nclimate3241</pub-id> </citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Donnat</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Holmes</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Tracking Network Dynamics: A Survey Using Graph Distances</article-title>. <source>Ann. Appl. Stat.</source> <volume>12</volume>, <fpage>971</fpage>&#x2013;<lpage>1012</lpage>. <pub-id pub-id-type="doi">10.1214/18-aoas1176</pub-id> </citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ebert-Uphoff</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Deng</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Causal Discovery for Climate Research Using Graphical Models</article-title>. <source>J.&#x20;Clim.</source> <volume>25</volume>, <fpage>5648</fpage>&#x2013;<lpage>5665</lpage>. <pub-id pub-id-type="doi">10.1175/jcli-d-11-00387.1</pub-id> </citation>
</ref>
<ref id="B24">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Entner</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Hoyer</surname>
<given-names>P. O.</given-names>
</name>
</person-group> (<year>2010</year>). &#x201c;<article-title>On Causal Discovery from Time Series Data Using FCI</article-title>,&#x201d; in <conf-name>Proceedings of the Fifth European Workshop on Probabilistic Graphical Models</conf-name>, <conf-loc>Helsinki, Finland</conf-loc>. Editors <person-group person-group-type="editor">
<name>
<surname>Myllymaeki</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Roos</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Jaakkola</surname>
<given-names>T.</given-names>
</name>
</person-group> (<publisher-name>HIIT Publications, 2010</publisher-name>), <fpage>121</fpage>&#x2013;<lpage>128</lpage>. </citation>
</ref>
<ref id="B25">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Eveleigh</surname>
<given-names>V. W.</given-names>
</name>
</person-group> (<year>1967</year>). <source>Adaptive Control and Optimization Techniques</source>. <comment>McGraw-Hill Electrical and Electronic Engineering Series</comment> (<publisher-loc>New York</publisher-loc>: <publisher-name>McGraw-Hill</publisher-name>). </citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Graham</surname>
<given-names>R. M.</given-names>
</name>
<name>
<surname>Cohen</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Ritzhaupt</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Segger</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Graversen</surname>
<given-names>R. G.</given-names>
</name>
<name>
<surname>Rinke</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Evaluation of Six Atmospheric Reanalyses over Arctic Sea Ice from Winter to Early Summer</article-title>. <source>J.&#x20;Clim.</source> <volume>32</volume>, <fpage>4121</fpage>&#x2013;<lpage>4143</lpage>. <pub-id pub-id-type="doi">10.1175/jcli-d-18-0643.1</pub-id> </citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Granger</surname>
<given-names>C. W. J.</given-names>
</name>
</person-group> (<year>1969</year>). <article-title>Investigating Causal Relations by Econometric Models and Cross-Spectral Methods</article-title>. <source>Econometrica</source> <volume>37</volume>, <fpage>424</fpage>&#x2013;<lpage>438</lpage>. <pub-id pub-id-type="doi">10.2307/1912791</pub-id> </citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Guemas</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Blanchard-Wrigglesworth</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Chevallier</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Day</surname>
<given-names>J.&#x20;J.</given-names>
</name>
<name>
<surname>D&#xe9;qu&#xe9;</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Doblas-Reyes</surname>
<given-names>F. J.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>A Review on Arctic Sea-Ice Predictability and Prediction on Seasonal to Decadal Time-Scales</article-title>. <source>Q. J.&#x20;R. Meteorol. Soc.</source> <volume>142</volume>, <fpage>546</fpage>&#x2013;<lpage>561</lpage>. <pub-id pub-id-type="doi">10.1002/qj.2401</pub-id> </citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Guo</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Cheng</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Hahn</surname>
<given-names>P. R.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>A Survey of Learning Causality with Data: Problems and Methods</article-title>. <source>ACM Comput. Surv.</source> <volume>53</volume>, <fpage>1</fpage>&#x2013;<lpage>37</lpage>. <pub-id pub-id-type="doi">10.1145/3397269</pub-id> </citation>
</ref>
<ref id="B30">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Hamilton</surname>
<given-names>J.&#x20;D.</given-names>
</name>
</person-group> (<year>1994</year>). <source>Time Series Analysis</source>. <publisher-name>Princeton University Press</publisher-name>.</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Heckerman</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Geiger</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Chickering</surname>
<given-names>D. M.</given-names>
</name>
</person-group> (<year>1995</year>). <article-title>Learning Bayesian Networks: The Combination of Knowledge and Statistical Data</article-title>. <source>Mach. Learn.</source> <volume>20</volume>, <fpage>197</fpage>&#x2013;<lpage>243</lpage>. <pub-id pub-id-type="doi">10.1007/bf00994016</pub-id> </citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hersbach</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Bell</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Berrisford</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Hirahara</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Hor&#xe1;nyi</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Mu&#xf1;oz-Sabater</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>The ERA5 Global Reanalysis</article-title>. <source>Q. J.&#x20;R. Meteorol. Soc.</source> <volume>146</volume>, <fpage>1999</fpage>&#x2013;<lpage>2049</lpage>. <pub-id pub-id-type="doi">10.1002/qj.3803</pub-id> </citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hochreiter</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>1998</year>). <article-title>The Vanishing Gradient Problem during Learning Recurrent Neural Nets and Problem Solutions</article-title>. <source>Int. J.&#x20;Unc. Fuzz. Knowl. Based Syst.</source> <volume>06</volume>, <fpage>107</fpage>&#x2013;<lpage>116</lpage>. <pub-id pub-id-type="doi">10.1142/s0218488598000094</pub-id> </citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Holland</surname>
<given-names>M. M.</given-names>
</name>
<name>
<surname>Bitz</surname>
<given-names>C. M.</given-names>
</name>
</person-group> (<year>2003</year>). <article-title>Polar Amplification of Climate Change in Coupled Models</article-title>. <source>Clim. Dyn.</source> <volume>21</volume>, <fpage>221</fpage>&#x2013;<lpage>232</lpage>. <pub-id pub-id-type="doi">10.1007/s00382-003-0332-6</pub-id> </citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Holland</surname>
<given-names>M. M.</given-names>
</name>
<name>
<surname>Landrum</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Bailey</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Vavrus</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Changing Seasonal Predictability of Arctic Summer Sea Ice Area in a Warming Climate</article-title>. <source>J.&#x20;Clim.</source> <volume>32</volume>, <fpage>4963</fpage>&#x2013;<lpage>4979</lpage>. <pub-id pub-id-type="doi">10.1175/jcli-d-19-0034.1</pub-id> </citation>
</ref>
<ref id="B112">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Ding</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Dong</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Xi</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Baxter</surname>
<given-names>I.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Summertime Low Clouds Mediate the Impact of the Large-Scale Circulation on Arctic Sea Ice</article-title>. <source>Commun. Earth Environ.</source> <volume>2</volume>, <fpage>1</fpage>&#x2013;<lpage>10</lpage>. <pub-id pub-id-type="doi">10.1038/s43247-021-00114-w</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Dong</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Bailey</surname>
<given-names>D. A.</given-names>
</name>
<name>
<surname>Holland</surname>
<given-names>M. M.</given-names>
</name>
<name>
<surname>Xi</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>DuVivier</surname>
<given-names>A. K.</given-names>
</name>
<etal/>
</person-group> (<year>2019a</year>). <article-title>Thicker Clouds and Accelerated Arctic Sea Ice Decline: The Atmosphere&#x2010;Sea Ice Interactions in Spring</article-title>. <source>Geophys. Res. Lett.</source> <volume>46</volume>, <fpage>6980</fpage>&#x2013;<lpage>6989</lpage>. <pub-id pub-id-type="doi">10.1029/2019gl082791</pub-id> </citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Dong</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Xi</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Deng</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2019b</year>). <article-title>A Survey of the Atmospheric Physical Processes Key to the Onset of Arctic Sea Ice Melt in Spring</article-title>. <source>Clim. Dyn.</source> <volume>52</volume>, <fpage>4907</fpage>&#x2013;<lpage>4922</lpage>. <pub-id pub-id-type="doi">10.1007/s00382-018-4422-x</pub-id> </citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Huang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Dong</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Xi</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Dolinar</surname>
<given-names>E. K.</given-names>
</name>
<name>
<surname>Stanfield</surname>
<given-names>R. E.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>The Footprints of 16&#x20;Year Trends of Arctic Springtime Cloud and Radiation Properties on September Sea Ice Retreat</article-title>. <source>J.&#x20;Geophys. Res. Atmos.</source> <volume>122</volume>, <fpage>2179</fpage>&#x2013;<lpage>2193</lpage>. <pub-id pub-id-type="doi">10.1002/2016jd026020</pub-id> </citation>
</ref>
<ref id="B39">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Huang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Kleindessner</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Munishkin</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Varshney</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2020</year>). &#x201c;<article-title>Benchmarking of Data-Driven Causality Discovery Approaches in the Interactions of Arctic Sea Ice and Atmosphere</article-title>,&#x201d; in <source>Technical Report HPCF-2020-16, UMBC High Performance Computing Facility</source> (<publisher-name>University of Maryland, Baltimore County</publisher-name>). </citation>
</ref>
<ref id="B40">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Hussung</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Mahmud</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Sampath</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2019</year>). &#x201c;<article-title>Evaluation of Data-Driven Causality Discovery Approaches Among Dominant Climate Modes</article-title>,&#x201d; in <source>Technical Report HPCF-2019-12, UMBC High Performance Computing Facility</source> (<publisher-name>University of Maryland, Baltimore County</publisher-name>). </citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Iler</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Inouye</surname>
<given-names>D. W.</given-names>
</name>
<name>
<surname>Schmidt</surname>
<given-names>N. M.</given-names>
</name>
<name>
<surname>H&#xf8;ye</surname>
<given-names>T. T.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Detrending Phenological Time Series Improves Climate-Phenology Analyses and Reveals Evidence of Plasticity</article-title>. <source>Ecology</source> <volume>98</volume>, <fpage>647</fpage>&#x2013;<lpage>655</lpage>. <pub-id pub-id-type="doi">10.1002/ecy.1690</pub-id> </citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kapsch</surname>
<given-names>M.-L.</given-names>
</name>
<name>
<surname>Graversen</surname>
<given-names>R. G.</given-names>
</name>
<name>
<surname>Tjernstr&#xf6;m</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Bintanja</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>The Effect of Downwelling Longwave and Shortwave Radiation on Arctic Summer Sea Ice</article-title>. <source>J.&#x20;Clim.</source> <volume>29</volume>, <fpage>1143</fpage>&#x2013;<lpage>1159</lpage>. <pub-id pub-id-type="doi">10.1175/jcli-d-15-0238.1</pub-id> </citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kapsch</surname>
<given-names>M.-L.</given-names>
</name>
<name>
<surname>Graversen</surname>
<given-names>R. G.</given-names>
</name>
<name>
<surname>Tjernstr&#xf6;m</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Springtime Atmospheric Energy Transport and the Control of Arctic Summer Sea-Ice Extent</article-title>. <source>Nat. Clim. Change</source> <volume>3</volume>, <fpage>744</fpage>&#x2013;<lpage>748</lpage>. <pub-id pub-id-type="doi">10.1038/nclimate1884</pub-id> </citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kapsch</surname>
<given-names>M.-L.</given-names>
</name>
<name>
<surname>Skific</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Graversen</surname>
<given-names>R. G.</given-names>
</name>
<name>
<surname>Tjernstr&#xf6;m</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Francis</surname>
<given-names>J.&#x20;A.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Summers with Low Arctic Sea Ice Linked to Persistence of Spring Atmospheric Circulation Patterns</article-title>. <source>Clim. Dyn.</source> <volume>52</volume>, <fpage>2497</fpage>&#x2013;<lpage>2512</lpage>. <pub-id pub-id-type="doi">10.1007/s00382-018-4279-z</pub-id> </citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kawale</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Liess</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Kumar</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Steinbach</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Snyder</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Kumar</surname>
<given-names>V.</given-names>
</name>
<etal/>
</person-group> (<year>2013</year>). <article-title>A Graph-Based Approach to Find Teleconnections in Climate Data</article-title>. <source>Stat. Anal. Data Min.</source> <volume>6</volume>, <fpage>158</fpage>&#x2013;<lpage>179</lpage>. <pub-id pub-id-type="doi">10.1002/sam.11181</pub-id> </citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kay</surname>
<given-names>J.&#x20;E.</given-names>
</name>
<name>
<surname>Gettelman</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Cloud Influence on and Response to Seasonal Arctic Sea Ice Loss</article-title>. <source>J.&#x20;Geophys. Res. Atmos.</source> <volume>114</volume>. <pub-id pub-id-type="doi">10.1029/2009jd011773</pub-id> </citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kennel</surname>
<given-names>C. F.</given-names>
</name>
<name>
<surname>Yulaeva</surname>
<given-names>E.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Influence of Arctic Sea-Ice Variability on Pacific Trade Winds</article-title>. <source>Proc. Natl. Acad. Sci. USA</source> <volume>117</volume>, <fpage>2824</fpage>&#x2013;<lpage>2834</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1717707117</pub-id> </citation>
</ref>
<ref id="B48">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Kingma</surname>
<given-names>D. P.</given-names>
</name>
<name>
<surname>Welling</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2014</year>). &#x201c;<article-title>Auto-Encoding Variational Bayes</article-title>,&#x201d; in <conf-name>2nd International Conference on Learning Representations, ICLR 2014. Conference Track Proceedings</conf-name>, <conf-loc>Banff, AB, Canada</conf-loc>, <conf-date>April 14-16, 2014</conf-date>. Editors <person-group person-group-type="editor">
<name>
<surname>Bengio</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>LeCun</surname>
<given-names>Y.</given-names>
</name>
</person-group> </citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kopec</surname>
<given-names>B. G.</given-names>
</name>
<name>
<surname>Feng</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Michel</surname>
<given-names>F. A.</given-names>
</name>
<name>
<surname>Posmentier</surname>
<given-names>E. S.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Influence of Sea Ice on Arctic Precipitation</article-title>. <source>Proc. Natl. Acad. Sci. USA</source> <volume>113</volume>, <fpage>46</fpage>&#x2013;<lpage>51</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1504633113</pub-id> </citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kretschmer</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Coumou</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Donges</surname>
<given-names>J.&#x20;F.</given-names>
</name>
<name>
<surname>Runge</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Using Causal Effect Networks to Analyze Different Arctic Drivers of Midlatitude Winter Circulation</article-title>. <source>J.&#x20;Clim.</source> <volume>29</volume>, <fpage>4069</fpage>&#x2013;<lpage>4081</lpage>. <pub-id pub-id-type="doi">10.1175/jcli-d-15-0654.1</pub-id> </citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lee</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Gong</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Feldstein</surname>
<given-names>S. B.</given-names>
</name>
<name>
<surname>Screen</surname>
<given-names>J.&#x20;A.</given-names>
</name>
<name>
<surname>Simmonds</surname>
<given-names>I.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Revisiting the Cause of the 1989&#x2013;2009 Arctic Surface Warming Using the Surface Energy Budget: Downward Infrared Radiation Dominates the Surface Fluxes</article-title>. <source>Geophys. Res. Lett.</source> <volume>44</volume>, <fpage>10,654</fpage>&#x2013;<lpage>10,661</lpage>. <pub-id pub-id-type="doi">10.1002/2017gl075375</pub-id> </citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Fedorov</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>W.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>AMOC Stability and Diverging Response to Arctic Sea Ice Decline in Two Climate Models</article-title>. <source>J.&#x20;Clim.</source> <volume>34</volume>, <fpage>5443</fpage>&#x2013;<lpage>5460</lpage>. <pub-id pub-id-type="doi">10.1175/jcli-d-20-0572.1</pub-id> </citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Loh</surname>
<given-names>P.-L.</given-names>
</name>
<name>
<surname>B&#xfc;hlmann</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>High-Dimensional Learning of Linear Causal Networks via Inverse Covariance Estimation</article-title>. <source>J.&#x20;Machine Learn. Res.</source> <volume>15</volume>, <fpage>3065</fpage>&#x2013;<lpage>3105</lpage>. </citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Luo</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Zhong</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Simmonds</surname>
<given-names>I.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Atmospheric Circulation Patterns Which Promote Winter Arctic Sea Ice Decline</article-title>. <source>Environ. Res. Lett.</source> <volume>12</volume>, <fpage>054017</fpage>. <pub-id pub-id-type="doi">10.1088/1748-9326/aa69d0</pub-id> </citation>
</ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Luo</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Dai</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Simmonds</surname>
<given-names>I.</given-names>
</name>
</person-group> (<year>2019a</year>). <article-title>The Winter Midlatitude-Arctic Interaction: Effects of North Atlantic SST and High-Latitude Blocking on Arctic Sea Ice and Eurasian Cooling</article-title>. <source>Clim. Dyn.</source> <volume>52</volume>, <fpage>2981</fpage>&#x2013;<lpage>3004</lpage>. <pub-id pub-id-type="doi">10.1007/s00382-018-4301-5</pub-id> </citation>
</ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Luo</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Dai</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Simmonds</surname>
<given-names>I.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Changes in Atmospheric Blocking Circulations Linked with Winter Arctic Warming: A New Perspective</article-title>. <source>J.&#x20;Clim.</source> <volume>31</volume>, <fpage>7661</fpage>&#x2013;<lpage>7678</lpage>. <pub-id pub-id-type="doi">10.1175/jcli-d-18-0040.1</pub-id> </citation>
</ref>
<ref id="B57">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Luo</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Overland</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Simmonds</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2019b</year>). <article-title>Weakened Potential Vorticity Barrier Linked to Recent Winter Arctic Sea Ice Loss and Midlatitude Cold Extremes</article-title>. <source>J.&#x20;Clim.</source> <volume>32</volume>, <fpage>4235</fpage>&#x2013;<lpage>4261</lpage>. <pub-id pub-id-type="doi">10.1175/jcli-d-18-0449.1</pub-id> </citation>
</ref>
<ref id="B113">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Luo</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Ding</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Baxter</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Bushuk</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Summertime Atmosphere&#x2013;Sea Ice Coupling in the Arctic Simulated by CMIP5/6 Models: Importance of Large-Scale Circulation</article-title>. <source>Clim. Dyn.</source> <volume>56</volume>, <fpage>1467</fpage>&#x2013;<lpage>1485</lpage>. <pub-id pub-id-type="doi">10.1007/s00382-020-05543-5</pub-id>
</citation>
</ref>
<ref id="B114">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Marcovecchio</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Behrangi</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Dong</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Xi</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Precipitation Influence on and Response to Early and Late Arctic Sea Ice Melt Onset During Melt Season</article-title>. <source>Int. J. Climatol.</source>, <fpage>1</fpage>&#x2013;<lpage>16</lpage>. <pub-id pub-id-type="doi">10.1002/joc.7233</pub-id>
</citation>
</ref>
<ref id="B58">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Matthewman</surname>
<given-names>N. J.</given-names>
</name>
<name>
<surname>Magnusdottir</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Observed Interaction between Pacific Sea Ice and the Western Pacific Pattern on Intraseasonal Time Scales</article-title>. <source>J.&#x20;Clim.</source> <volume>24</volume>, <fpage>5031</fpage>&#x2013;<lpage>5042</lpage>. <pub-id pub-id-type="doi">10.1175/2011jcli4216.1</pub-id> </citation>
</ref>
<ref id="B59">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mayer</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Tietsche</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Haimberger</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Tsubouchi</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Mayer</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zuo</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>An Improved Estimate of the Coupled Arctic Energy Budget</article-title>. <source>J.&#x20;Clim.</source> <volume>32</volume>, <fpage>7915</fpage>&#x2013;<lpage>7934</lpage>. <pub-id pub-id-type="doi">10.1175/jcli-d-19-0233.1</pub-id> </citation>
</ref>
<ref id="B60">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>McGraw</surname>
<given-names>M. C.</given-names>
</name>
<name>
<surname>Barnes</surname>
<given-names>E. A.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Memory Matters: A Case for Granger Causality in Climate Variability Studies</article-title>. <source>J.&#x20;Clim.</source> <volume>31</volume>, <fpage>3289</fpage>&#x2013;<lpage>3300</lpage>. <pub-id pub-id-type="doi">10.1175/jcli-d-17-0334.1</pub-id> </citation>
</ref>
<ref id="B61">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Morrison</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Kay</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Chepfer</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Guzman</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Yettella</surname>
<given-names>V.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Isolating the Liquid Cloud Response to Recent Arctic Sea Ice Variability Using Spaceborne Lidar Observations</article-title>. <source>J.&#x20;Geophys. Res. Atmospheres</source> <volume>123</volume>, <fpage>473</fpage>&#x2013;<lpage>490</lpage>. <pub-id pub-id-type="doi">10.1002/2017jd027248</pub-id> </citation>
</ref>
<ref id="B62">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Nauta</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Bucur</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Seifert</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2019</year>). &#x201c;<article-title>Causal Discovery with Attention-Based Convolutional Neural Networks</article-title>,&#x201d; in <source>Machine Learning and Knowledge Extraction</source>, <volume>1</volume>, <fpage>312</fpage>&#x2013;<lpage>340</lpage>. <comment>Code available on: <ext-link ext-link-type="uri" xlink:href="https://github.com/M-Nauta/TCDF">https://github.com/M-Nauta/TCDF</ext-link></comment>. <pub-id pub-id-type="doi">10.3390/make1010019</pub-id> </citation>
</ref>
<ref id="B63">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Nocedal</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wright</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2006</year>). <source>Numerical Optimization</source>. <publisher-name>Springer</publisher-name>.</citation>
</ref>
<ref id="B64">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nussbaumer</surname>
<given-names>E. A.</given-names>
</name>
<name>
<surname>Pinker</surname>
<given-names>R. T.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>The Role of Shortwave Radiation in the 2007 Arctic Sea Ice Anomaly</article-title>. <source>Geophys. Res. Lett.</source> <volume>39</volume>, <fpage>L15808</fpage>. <pub-id pub-id-type="doi">10.1029/2012gl052415</pub-id> </citation>
</ref>
<ref id="B65">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Overland</surname>
<given-names>J.&#x20;E.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Large-scale Atmospheric Circulation Changes Are Associated with the Recent Loss of Arctic Sea Ice</article-title>. <source>Tellus A: Dynamic Meteorology and Oceanography</source> <volume>62</volume>, <fpage>1</fpage>&#x2013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1111/j.1600-0870.2009.00421.x</pub-id> </citation>
</ref>
<ref id="B66">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Overpeck</surname>
<given-names>J.&#x20;T.</given-names>
</name>
<name>
<surname>Meehl</surname>
<given-names>G. A.</given-names>
</name>
<name>
<surname>Bony</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Easterling</surname>
<given-names>D. R.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Climate Data Challenges in the 21st Century</article-title>. <source>Science</source> <volume>331</volume>, <fpage>700</fpage>&#x2013;<lpage>702</lpage>. <pub-id pub-id-type="doi">10.1126/science.1197869</pub-id> </citation>
</ref>
<ref id="B67">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Parkinson</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Comiso</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>On the 2012 Record Low Arctic Sea Ice Cover: Combined Impact of Preconditioning and an August Storm</article-title>. <source>Geophys. Res. Lett.</source> <volume>40</volume>. <pub-id pub-id-type="doi">10.1002/grl.50349</pub-id> </citation>
</ref>
<ref id="B68">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Perovich</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Grenfell</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Light</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Hobbs</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2002</year>). <article-title>Seasonal Evolution of the Albedo of Multiyear Arctic Sea Ice</article-title>. <source>J.&#x20;Geophys. Res. Oceans</source> <volume>107</volume>, <fpage>SHE 20-1-SHE 20-13</fpage>. <pub-id pub-id-type="doi">10.1029/2000jc000438</pub-id> </citation>
</ref>
<ref id="B69">
<citation citation-type="book">
<comment>[Dataset]</comment> <person-group person-group-type="author">
<name>
<surname>Peters</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Janzing</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Sch&#xf6;lkopf</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Causal Inference on Time Series Using Structural Equation Models</article-title>. <source>arXiv preprint</source>. <comment>arXiv:1207.5136</comment>.</citation>
</ref>
<ref id="B70">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ramsey</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Glymour</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Sanchez-Romero</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Glymour</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>A Million Variables and More: the Fast Greedy Equivalence Search Algorithm for Learning High-Dimensional Graphical Causal Models, with an Application to Functional Magnetic Resonance Images</article-title>. <source>Int. J.&#x20;Data Sci. Anal.</source> <volume>3</volume>, <fpage>121</fpage>&#x2013;<lpage>129</lpage>. <pub-id pub-id-type="doi">10.1007/s41060-016-0032-z</pub-id> </citation>
</ref>
<ref id="B71">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rinke</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Knudsen</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Mewes</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Dorn</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Handorf</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Dethloff</surname>
<given-names>K.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Arctic Summer Sea Ice Melt and Related Atmospheric Conditions in Coupled Regional Climate Model Simulations and Observations</article-title>. <source>J.&#x20;Geophys. Res. Atmospheres</source> <volume>124</volume>, <fpage>6027</fpage>&#x2013;<lpage>6039</lpage>. <pub-id pub-id-type="doi">10.1029/2018jd030207</pub-id> </citation>
</ref>
<ref id="B72">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Runge</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Nowack</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Kretschmer</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Flaxman</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Sejdinovic</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Detecting and Quantifying Causal Associations in Large Nonlinear Time Series Datasets</article-title>. <source>Sci. Adv.</source> <volume>5</volume>, <fpage>eaau4996</fpage>. <pub-id pub-id-type="doi">10.1126/sciadv.aau4996</pub-id> </citation>
</ref>
<ref id="B73">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Samarasinghe</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>McGraw</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Barnes</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Ebert-Uphoff</surname>
<given-names>I.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>A Study of Links between the Arctic and the Midlatitude Jet Stream Using Granger and Pearl Causality</article-title>. <source>Environmetrics</source> <volume>30</volume>, <fpage>e2540</fpage>. <pub-id pub-id-type="doi">10.1002/env.2540</pub-id> </citation>
</ref>
<ref id="B74">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Schmidhuber</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Deep Learning in Neural Networks: An Overview</article-title>. <source>Neural Networks</source> <volume>61</volume>, <fpage>85</fpage>&#x2013;<lpage>117</lpage>. <pub-id pub-id-type="doi">10.1016/j.neunet.2014.09.003</pub-id> </citation>
</ref>
<ref id="B75">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Screen</surname>
<given-names>J.&#x20;A.</given-names>
</name>
<name>
<surname>Bracegirdle</surname>
<given-names>T. J.</given-names>
</name>
<name>
<surname>Simmonds</surname>
<given-names>I.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Polar Climate Change as Manifest in Atmospheric Circulation</article-title>. <source>Curr. Clim. Change Rep.</source> <volume>4</volume>, <fpage>383</fpage>&#x2013;<lpage>395</lpage>. <pub-id pub-id-type="doi">10.1007/s40641-018-0111-4</pub-id> </citation>
</ref>
<ref id="B76">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Screen</surname>
<given-names>J.&#x20;A.</given-names>
</name>
<name>
<surname>Simmonds</surname>
<given-names>I.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Declining Summer Snowfall in the Arctic: Causes, Impacts and Feedbacks</article-title>. <source>Clim. Dyn.</source> <volume>38</volume>, <fpage>2243</fpage>&#x2013;<lpage>2256</lpage>. <pub-id pub-id-type="doi">10.1007/s00382-011-1105-2</pub-id> </citation>
</ref>
<ref id="B77">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Screen</surname>
<given-names>J.&#x20;A.</given-names>
</name>
<name>
<surname>Simmonds</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Keay</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Dramatic Interannual Changes of Perennial Arctic Sea Ice Linked to Abnormal Summer Storm Activity</article-title>. <source>J.&#x20;Geophys. Res. Atmospheres</source> <volume>116</volume>, <fpage>D15105</fpage>. <pub-id pub-id-type="doi">10.1029/2011jd015847</pub-id> </citation>
</ref>
<ref id="B78">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Semmler</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>McGrath</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>The Impact of Arctic Sea Ice on the Arctic Energy Budget and on the Climate of the Northern Mid-latitudes</article-title>. <source>Clim. Dyn.</source> <volume>39</volume>, <fpage>2675</fpage>&#x2013;<lpage>2694</lpage>. <pub-id pub-id-type="doi">10.1007/s00382-012-1353-9</pub-id> </citation>
</ref>
<ref id="B79">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Serreze</surname>
<given-names>M. C.</given-names>
</name>
<name>
<surname>Stroeve</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Arctic Sea Ice Trends, Variability and Implications for Seasonal Ice Forecasting</article-title>. <source>Philos. Trans. A. Math. Phys. Eng. Sci.</source> <volume>373</volume>, <fpage>20140159</fpage>. <pub-id pub-id-type="doi">10.1098/rsta.2014.0159</pub-id> </citation>
</ref>
<ref id="B80">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Serreze</surname>
<given-names>M. C.</given-names>
</name>
<name>
<surname>Barry</surname>
<given-names>R. G.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Processes and Impacts of Arctic Amplification: A Research Synthesis</article-title>. <source>Glob. Planet. Change</source> <volume>77</volume>, <fpage>85</fpage>&#x2013;<lpage>96</lpage>. <pub-id pub-id-type="doi">10.1016/j.gloplacha.2011.03.004</pub-id> </citation>
</ref>
<ref id="B81">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Simmonds</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Burke</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Keay</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Arctic Climate Change as Manifest in Cyclone Behavior</article-title>. <source>J.&#x20;Clim.</source> <volume>21</volume>, <fpage>5777</fpage>&#x2013;<lpage>5796</lpage>. <pub-id pub-id-type="doi">10.1175/2008jcli2366.1</pub-id> </citation>
</ref>
<ref id="B82">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Simmonds</surname>
<given-names>I.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Comparing and Contrasting the Behaviour of Arctic and Antarctic Sea Ice over the 35&#x20;Year Period 1979&#x2013;2013</article-title>. <source>Ann. Glaciol.</source> <volume>56</volume>, <fpage>18</fpage>&#x2013;<lpage>28</lpage>. <pub-id pub-id-type="doi">10.3189/2015aog69a909</pub-id> </citation>
</ref>
<ref id="B83">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Simmonds</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Govekar</surname>
<given-names>P. D.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>What Are the Physical Links between Arctic Sea Ice Loss and Eurasian Winter Climate?</article-title> <source>Environ. Res. Lett.</source> <volume>9</volume>, <fpage>101003</fpage>. <pub-id pub-id-type="doi">10.1088/1748-9326/9/10/101003</pub-id> </citation>
</ref>
<ref id="B84">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Simmonds</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Keay</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Extraordinary September Arctic Sea Ice Reductions and Their Relationships with Storm Behavior over 1979&#x2013;2008</article-title>. <source>Geophys. Res. Lett.</source> <volume>36</volume>, <fpage>L19715</fpage>. <pub-id pub-id-type="doi">10.1029/2009gl039810</pub-id> </citation>
</ref>
<ref id="B85">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Simmonds</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Rudeva</surname>
<given-names>I.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>A Comparison of Tracking Methods for Extreme Cyclones in the Arctic Basin</article-title>. <source>Tellus A: Dynamic Meteorology and Oceanography</source> <volume>66</volume>, <fpage>25252</fpage>. <pub-id pub-id-type="doi">10.3402/tellusa.v66.25252</pub-id> </citation>
</ref>
<ref id="B86">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Simmonds</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Rudeva</surname>
<given-names>I.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>The Great Arctic Cyclone of August 2012</article-title>. <source>Geophys. Res. Lett.</source> <volume>39</volume>, <fpage>L23709</fpage>. <pub-id pub-id-type="doi">10.1029/2012gl054259</pub-id> </citation>
</ref>
<ref id="B87">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Song</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Tian</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Hybrid Causality Analysis of ENSO&#x2019;s Global Impacts on Climate Variables Based on Data-Driven Analytics and Climate Model Simulation</article-title>. <source>Front. Earth Sci.</source> <volume>7</volume>, <fpage>233</fpage>. <pub-id pub-id-type="doi">10.3389/feart.2019.00233</pub-id> </citation>
</ref>
<ref id="B88">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Song</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Tian</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2018</year>). &#x201c;<article-title>Spatio-Temporal Climate Data Causality Analytics&#x2014;An Analysis of ENSO&#x2019;s Global Impacts</article-title>,&#x201d; in <conf-name>Proceedings of the 8th International Workshop on Climate Informatics (CI2018)</conf-name>, <conf-loc>Boulder, CO, United States</conf-loc>, <conf-date>September 19&#x2013;21, 2018</conf-date>, <fpage>45</fpage>&#x2013;<lpage>48</lpage>. </citation>
</ref>
<ref id="B89">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Spreen</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Kwok</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Menemenlis</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Trends in Arctic Sea Ice Drift and Role of Wind Forcing: 1992&#x2013;2009</article-title>. <source>Geophys. Res. Lett.</source> <volume>38</volume>. <pub-id pub-id-type="doi">10.1029/2011gl048970</pub-id> </citation>
</ref>
<ref id="B90">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Stocker</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Qin</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Plattner</surname>
<given-names>G.-K.</given-names>
</name>
<name>
<surname>Alexander</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Allen</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Bindoff</surname>
<given-names>N.</given-names>
</name>
<etal/>
</person-group> (<year>2013</year>). <source>Technical Summary</source>. <publisher-loc>Cambridge, United&#x20;Kingdom and New York, NY, USA</publisher-loc>: <publisher-name>Cambridge University Press</publisher-name>, <fpage>33</fpage>&#x2013;<lpage>115</lpage>. <comment>book section TS</comment>. <pub-id pub-id-type="doi">10.1017/CBO9781107415324.005</pub-id> </citation>
</ref>
<ref id="B91">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Strong</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Magnusdottir</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Stern</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Observed Feedback between Winter Sea Ice and the North Atlantic Oscillation</article-title>. <source>J.&#x20;Clim.</source> <volume>22</volume>, <fpage>6021</fpage>&#x2013;<lpage>6032</lpage>. <pub-id pub-id-type="doi">10.1175/2009jcli3100.1</pub-id> </citation>
</ref>
<ref id="B92">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sturm</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Holmgren</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Perovich</surname>
<given-names>D. K.</given-names>
</name>
</person-group> (<year>2002</year>). <article-title>Winter Snow Cover on the Sea Ice of the Arctic Ocean at the Surface Heat Budget of the Arctic Ocean (SHEBA): Temporal Evolution and Spatial Variability</article-title>. <source>J.&#x20;Geophys. Res. Oceans</source> <volume>107</volume>, <fpage>SHE 23-1-SHE 23-17</fpage>. <pub-id pub-id-type="doi">10.1029/2000jc000400</pub-id> </citation>
</ref>
<ref id="B93">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Perlwitz</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Hoerling</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>What Caused the Recent &#x201c;Warm Arctic, Cold Continents&#x201d; Trend Pattern in Winter Temperatures?</article-title> <source>Geophys. Res. Lett.</source> <volume>43</volume>, <fpage>5345</fpage>&#x2013;<lpage>5352</lpage>. <pub-id pub-id-type="doi">10.1002/2016gl069024</pub-id> </citation>
</ref>
<ref id="B94">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Tan</surname>
<given-names>H. H.</given-names>
</name>
<name>
<surname>Lim</surname>
<given-names>K. H.</given-names>
</name>
</person-group> (<year>2019</year>). &#x201c;<article-title>Vanishing Gradient Mitigation with Deep Learning Neural Network Optimization</article-title>,&#x201d; in <conf-name>2019 7th International Conference on Smart Computing &#x26; Communications (ICSCC)</conf-name>, <conf-loc>Sarawak, Malaysia</conf-loc>, <conf-date>June 28&#x2013;30, 2019</conf-date> (<publisher-name>IEEE</publisher-name>), <fpage>1</fpage>&#x2013;<lpage>4</lpage>. <pub-id pub-id-type="doi">10.1109/icscc.2019.8843652</pub-id> </citation>
</ref>
<ref id="B95">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Taylor</surname>
<given-names>P. C.</given-names>
</name>
<name>
<surname>Kato</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>K. M.</given-names>
</name>
<name>
<surname>Cai</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Covariance between Arctic Sea Ice and Clouds within Atmospheric State Regimes at the Satellite Footprint Level</article-title>. <source>J.&#x20;Geophys. Res. Atmos.</source> <volume>120</volume>, <fpage>12656</fpage>&#x2013;<lpage>12678</lpage>. <pub-id pub-id-type="doi">10.1002/2015jd023520</pub-id> </citation>
</ref>
<ref id="B96">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Top&#xe1;l</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Ding</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Mitchell</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Baxter</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Herein</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Haszpra</surname>
<given-names>T.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>An Internal Atmospheric Process Determining Summertime Arctic Sea Ice Melting in the Next Three Decades: Lessons Learned from Five Large Ensembles and Multiple CMIP5 Climate Simulations</article-title>. <source>J.&#x20;Clim.</source> <volume>33</volume>, <fpage>7431</fpage>&#x2013;<lpage>7454</lpage>. <pub-id pub-id-type="doi">10.1175/jcli-d-19-0803.1</pub-id> </citation>
</ref>
<ref id="B97">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Van de Geer</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>B&#xfc;hlmann</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title><italic>l</italic><sub>0</sub>-penalized Maximum Likelihood for Sparse Directed Acyclic Graphs</article-title>. <source>Ann. Stat.</source> <volume>41</volume>, <fpage>536</fpage>&#x2013;<lpage>567</lpage>. <pub-id pub-id-type="doi">10.1214/13-aos1085</pub-id> </citation>
</ref>
<ref id="B98">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Graham</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Gerland</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Granskog</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Comparison of ERA5 and ERA-Interim Near-Surface Air Temperature, Snowfall and Precipitation over Arctic Sea Ice: Effects on Sea Ice Thermodynamics and Evolution</article-title>. <source>The Cryosphere</source> <volume>13</volume>, <fpage>1661</fpage>&#x2013;<lpage>1679</lpage>. <pub-id pub-id-type="doi">10.5194/tc-13-1661-2019</pub-id> </citation>
</ref>
<ref id="B99">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Watanabe</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Ikeda</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Mizobata</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Walsh</surname>
<given-names>J.&#x20;E.</given-names>
</name>
<etal/>
</person-group> (<year>2009</year>). <article-title>Is the Dipole Anomaly a Major Driver to Record Lows in Arctic Summer Sea Ice Extent?</article-title> <source>Geophys. Res. Lett.</source> <volume>36</volume>, <fpage>L05706</fpage>. <pub-id pub-id-type="doi">10.1029/2008gl036706</pub-id> </citation>
</ref>
<ref id="B100">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Watanabe</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Sumi</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Hasumi</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2006</year>). <article-title>Arctic Dipole Anomaly and its Contribution to Sea Ice Export from the Arctic Ocean in the 20th Century</article-title>. <source>Geophys. Res. Lett.</source> <volume>33</volume>, <fpage>L23703</fpage>. <pub-id pub-id-type="doi">10.1029/2006gl028112</pub-id> </citation>
</ref>
<ref id="B101">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Weber</surname>
<given-names>R. O.</given-names>
</name>
<name>
<surname>Talkner</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2001</year>). <article-title>Spectra and Correlations of Climate Data from Days to Decades</article-title>. <source>J.&#x20;Geophys. Res.</source> <volume>106</volume>, <fpage>20131</fpage>&#x2013;<lpage>20144</lpage>. <pub-id pub-id-type="doi">10.1029/2001jd000548</pub-id> </citation>
</ref>
<ref id="B102">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Wei</surname>
<given-names>Q.</given-names>
</name>
</person-group> (<year>2018</year>). &#x201c;<article-title>Self-Learning Optimal Control of Nonlinear Systems: Adaptive Dynamic Programming Approach</article-title>,&#x201d; in <source>Studies in Systems, Decision and Control</source> (<publisher-loc>Singapore</publisher-loc>: <publisher-name>Springer Singapore</publisher-name>), <volume>103</volume>. </citation>
</ref>
<ref id="B103">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Overland</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>D&#x2019;Arrigo</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Anomalous Arctic Surface Wind Patterns and Their Impacts on September Sea Ice Minima and Trend</article-title>. <source>Tellus A: Dynamic Meteorology and Oceanography</source> <volume>64</volume>, <fpage>18590</fpage>. <pub-id pub-id-type="doi">10.3402/tellusa.v64i0.18590</pub-id> </citation>
</ref>
<ref id="B104">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>N. E.</given-names>
</name>
<name>
<surname>Long</surname>
<given-names>S. R.</given-names>
</name>
<name>
<surname>Peng</surname>
<given-names>C.-K.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>On the Trend, Detrending, and Variability of Nonlinear and Nonstationary Time Series</article-title>. <source>Proc. Natl. Acad. Sci.</source> <volume>104</volume>, <fpage>14889</fpage>&#x2013;<lpage>14894</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.0701020104</pub-id> </citation>
</ref>
<ref id="B105">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Dai</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Simmonds</surname>
<given-names>I.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Increased Quasi Stationarity and Persistence of Winter Ural Blocking and Eurasian Extreme Cold Events in Response to Arctic Warming. Part I: Insights from Observational Analyses</article-title>. <source>J.&#x20;Clim.</source> <volume>30</volume>, <fpage>3549</fpage>&#x2013;<lpage>3568</lpage>. <pub-id pub-id-type="doi">10.1175/jcli-d-16-0261.1</pub-id> </citation>
</ref>
<ref id="B106">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yin</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Sch&#xfc;tze</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Xiang</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Zhou</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>ABCNN: Attention-Based Convolutional Neural Network for Modeling Sentence Pairs</article-title>. <source>Trans. Assoc. Comput. Linguist.</source> <volume>4</volume>, <fpage>259</fpage>&#x2013;<lpage>272</lpage>. <pub-id pub-id-type="doi">10.1162/tacl_a_00097</pub-id> </citation>
</ref>
<ref id="B107">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Yu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Gao</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Yu</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2019</year>). &#x201c;<article-title>DAG-GNN: DAG Structure Learning with Graph Neural Networks</article-title>,&#x201d; in <conf-name>Proceedings of the 36th International Conference on Machine Learning</conf-name>, <conf-loc>Long Beach, CA, United States</conf-loc>, <conf-date>June 9&#x2013;15, 2019</conf-date>. <comment>Code available at: <ext-link ext-link-type="uri" xlink:href="https://github.com/fishmoon1234/DAG-GNN">https://github.com/fishmoon1234/DAG-GNN</ext-link></comment>. </citation>
</ref>
<ref id="B108">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zerenner</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Friederichs</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Lehnertz</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Hense</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>A Gaussian Graphical Model Approach to Climate Networks</article-title>. <source>Chaos</source> <volume>24</volume>, <fpage>023103</fpage>. <pub-id pub-id-type="doi">10.1063/1.4870402</pub-id> </citation>
</ref>
<ref id="B109">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Sch&#xf6;lkopf</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Spirtes</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Glymour</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Learning Causality and Causality-Related Learning: Some Recent Progress</article-title>. <source>Natl. Sci. Rev.</source> <volume>5</volume>, <fpage>26</fpage>&#x2013;<lpage>29</lpage>. <pub-id pub-id-type="doi">10.1093/nsr/nwx137</pub-id> </citation>
</ref>
<ref id="B110">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Polyakov</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Gerdes</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Inoue</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2013</year>). <article-title>Enhanced Poleward Moisture Transport and Amplified Northern High-Latitude Wetting Trend</article-title>. <source>Nat. Clim. Change</source> <volume>3</volume>, <fpage>47</fpage>&#x2013;<lpage>51</lpage>. <pub-id pub-id-type="doi">10.1038/nclimate1631</pub-id> </citation>
</ref>
<ref id="B111">
<citation citation-type="confproc">
<person-group person-group-type="author">
<name>
<surname>Zheng</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Aragam</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Ravikumar</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Xing</surname>
<given-names>E.</given-names>
</name>
</person-group> (<year>2018</year>). &#x201c;<article-title>DAGs with NO TEARS: Continuous Optimization for Structure Learning</article-title>,&#x201d; in <conf-name>Conference on Neural Information Processing Systems</conf-name>, <conf-loc>Montr&#xe9;al, Canada</conf-loc>, <conf-date>December 2&#x2013;8, 2018</conf-date>. (<publisher-name>NeurIPS</publisher-name>). <comment>Code available at: <ext-link ext-link-type="uri" xlink:href="https://github.com/xunzheng/notears">https://github.com/xunzheng/notears</ext-link></comment>. </citation>
</ref>
</ref-list>
</back>
</article>