<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Med.</journal-id>
<journal-title>Frontiers in Medicine</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Med.</abbrev-journal-title>
<issn pub-type="epub">2296-858X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fmed.2021.775047</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Medicine</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>An Interpretable Early Dynamic Sequential Predictor for Sepsis-Induced Coagulopathy Progression in the Real-World Using Machine Learning</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Cui</surname> <given-names>Ruixia</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="author-notes" rid="fn002"><sup>&#x02020;</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Hua</surname> <given-names>Wenbo</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="author-notes" rid="fn002"><sup>&#x02020;</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Qu</surname> <given-names>Kai</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Yang</surname> <given-names>Heran</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1500843/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Tong</surname> <given-names>Yingmu</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Li</surname> <given-names>Qinglin</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Wang</surname> <given-names>Hai</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Ma</surname> <given-names>Yanfen</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Liu</surname> <given-names>Sinan</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Lin</surname> <given-names>Ting</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Zhang</surname> <given-names>Jingyao</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x0002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1475764/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Sun</surname> <given-names>Jian</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="corresp" rid="c002"><sup>&#x0002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1501340/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Liu</surname> <given-names>Chang</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<xref ref-type="corresp" rid="c003"><sup>&#x0002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1511805/overview"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Department of Hepatobiliary Surgery, The First Affiliated Hospital of Xi&#x00027;an Jiaotong University</institution>, <addr-line>Xi&#x00027;an</addr-line>, <country>China</country></aff>
<aff id="aff2"><sup>2</sup><institution>Department of SICU, The First Affiliated Hospital of Xi&#x00027;an Jiaotong University</institution>, <addr-line>Xi&#x00027;an</addr-line>, <country>China</country></aff>
<aff id="aff3"><sup>3</sup><institution>School of Mathematics and Statistics, Xi&#x00027;an Jiaotong University</institution>, <addr-line>Xi&#x00027;an</addr-line>, <country>China</country></aff>
<aff id="aff4"><sup>4</sup><institution>Department of Clinical Laboratory, The First Affiliated Hospital of Xi&#x00027;an Jiaotong University</institution>, <addr-line>Xi&#x00027;an</addr-line>, <country>China</country></aff>
<aff id="aff5"><sup>5</sup><institution>Biobank, The First Affiliated Hospital of Xi&#x00027;an Jiaotong University</institution>, <addr-line>Xi&#x00027;an</addr-line>, <country>China</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Zhongheng Zhang, Sir Run Run Shaw Hospital, China</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Jesus Rico-Feijoo, Hospital Universitario R&#x000ED;o Hortega, Spain; Takeshi Wada, Hokkaido University, Japan</p></fn>
<corresp id="c001">&#x0002A;Correspondence: Jingyao Zhang <email>jingyaozhang&#x00040;xjtu.edu.cn</email></corresp>
<corresp id="c002">Jian Sun <email>jiansun&#x00040;xjtu.edu.cn</email></corresp>
<corresp id="c003">Chang Liu <email>liuchangfh&#x00040;xjtu.edu.cn</email></corresp>
<fn fn-type="other" id="fn001"><p>This article was submitted to Intensive Care Medicine and Anesthesiology, a section of the journal Frontiers in Medicine</p></fn>
<fn fn-type="equal" id="fn002"><p>&#x02020;These authors have contributed equally to this work</p></fn></author-notes>
<pub-date pub-type="epub">
<day>03</day>
<month>12</month>
<year>2021</year>
</pub-date>
<pub-date pub-type="collection">
<year>2021</year>
</pub-date>
<volume>8</volume>
<elocation-id>775047</elocation-id>
<history>
<date date-type="received">
<day>13</day>
<month>09</month>
<year>2021</year>
</date>
<date date-type="accepted">
<day>08</day>
<month>11</month>
<year>2021</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x000A9; 2021 Cui, Hua, Qu, Yang, Tong, Li, Wang, Ma, Liu, Lin, Zhang, Sun and Liu.</copyright-statement>
<copyright-year>2021</copyright-year>
<copyright-holder>Cui, Hua, Qu, Yang, Tong, Li, Wang, Ma, Liu, Lin, Zhang, Sun and Liu</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license></permissions>
<abstract><p>Sepsis-associated coagulation dysfunction greatly increases the mortality of sepsis. Irregular clinical time-series data remains a major challenge for AI medical applications. To early detect and manage sepsis-induced coagulopathy (SIC) and sepsis-associated disseminated intravascular coagulation (DIC), we developed an interpretable real-time sequential warning model toward real-world irregular data. Eight machine learning models including novel algorithms were devised to detect SIC and sepsis-associated DIC 8<italic>n</italic> (1 &#x02264; <italic>n</italic> &#x02264; 6) hours prior to its onset. Models were developed on Xi&#x00027;an Jiaotong University Medical College (XJTUMC) and verified on Beth Israel Deaconess Medical Center (BIDMC). A total of 12,154 SIC and 7,878 International Society on Thrombosis and Haemostasis (ISTH) overt-DIC labels were annotated according to the SIC and ISTH overt-DIC scoring systems in train set. The area under the receiver operating characteristic curve (AUROC) were used as model evaluation metrics. The eXtreme Gradient Boosting (XGBoost) model can predict SIC and sepsis-associated DIC events up to 48 h earlier with an AUROC of 0.929 and 0.910, respectively, and even reached 0.973 and 0.955 at 8 h earlier, achieving the highest performance to date. The novel ODE-RNN model achieved continuous prediction at arbitrary time points, and with an AUROC of 0.962 and 0.936 for SIC and DIC predicted 8 h earlier, respectively. In conclusion, our model can predict the sepsis-associated SIC and DIC onset up to 48 h in advance, which helps maximize the time window for early management by physicians.</p></abstract>
<kwd-group>
<kwd>SIC</kwd>
<kwd>sepsis-associated DIC</kwd>
<kwd>irregular time-series data</kwd>
<kwd>early real-time prediction</kwd>
<kwd>machine learning</kwd>
</kwd-group>
<counts>
<fig-count count="8"/>
<table-count count="2"/>
<equation-count count="2"/>
<ref-count count="36"/>
<page-count count="13"/>
<word-count count="7274"/>
</counts>
</article-meta>
</front>
<body>
<sec sec-type="intro" id="s1">
<title>Introduction</title>
<p>Sepsis is a lethal disease caused by a dysregulated host response in an infected state (<xref ref-type="bibr" rid="B1">1</xref>). Septic-induced organ dysfunction is a major cause of sepsis high mortality (<xref ref-type="bibr" rid="B2">2</xref>). Among these, coagulation dysfunction is a pervasive complication of sepsis, occurring in 50&#x02013;70% of sepsis patients, while approximately 35% of patients proceed to disseminated intravascular coagulation (DIC) (<xref ref-type="bibr" rid="B3">3</xref>). Sepsis-induced coagulopathy (SIC) mortality reaches to 23.1% (<xref ref-type="bibr" rid="B4">4</xref>), while the mortality rate of sepsis-associated DIC is more than twice that of simple sepsis patients (<xref ref-type="bibr" rid="B5">5</xref>, <xref ref-type="bibr" rid="B6">6</xref>). According to the SIC scoring system proposed by the DIC subcommittee of International Society on Thrombosis and Haemostasis (ISTH) in 2017, sepsis patients easily meet the SIC diagnostic criteria (<xref ref-type="bibr" rid="B7">7</xref>). Sepsis-associated DIC was diagnosed by the two-step sequential approach of SIC and ISTH overt-DIC criteria, which is a late-phase coagulation disorder that should be detected early (<xref ref-type="bibr" rid="B8">8</xref>). Currently, DIC diagnosis does not have a gold standard. Physicians diagnose DIC according to the primary disease, clinical manifestations, and laboratory tests. However, the clinical signs and symptoms of DIC appear slowly and the manifestations are complex and varied, resulting in a time lag in the clinical diagnosis of DIC, which places the patient in a treatment-refractory phase when sepsis-associated DIC is clinically determined (<xref ref-type="bibr" rid="B9">9</xref>). In addition, studies have shown that anticoagulation is ineffective in both sepsis and SIC patients, but effective in sepsis-induced DIC patients (<xref ref-type="bibr" rid="B10">10</xref>&#x02013;<xref ref-type="bibr" rid="B12">12</xref>). Hence, early recognition of sepsis-associated DIC is more important than SIC, while there are currently no studies on sequential prediction of sepsis-associated DIC after SIC alerts. Therefore, it is imperative to establish a model for early sequential real-time prediction of SIC and sepsis-associated DIC.</p>
<p>The prevalence of electronic health records (EHRs) and the upsurge of artificial intelligence (AI) provide opportunities for clinical medical research (<xref ref-type="bibr" rid="B13">13</xref>). Studies have shown that machine learning-based models outperform traditional clinical scoring and human expert systems in the diagnosis, treatment, and prognosis prediction of clinical diseases (<xref ref-type="bibr" rid="B14">14</xref>, <xref ref-type="bibr" rid="B15">15</xref>). However, current clinical prediction studies are mainly static and lack real-time prediction studies. Real-time prediction models dynamically predict the onset of disease within a sliding time-window by continuously updating clinical data. From the clinical dynamic treatment perspective, real-time predictive models would better fit the clinical applications (<xref ref-type="bibr" rid="B16">16</xref>). In addition, the variability of primary diseases, comorbidities and severity of conditions in ICU patients leads to sparse and irregular clinical data in terms of sampling time and dimensions (<xref ref-type="bibr" rid="B17">17</xref>). To accommodate irregular time series data, the existing standard models such as eXtreme Gradient Boosting (XGBoost) (<xref ref-type="bibr" rid="B18">18</xref>) and Recurrent Neural Network (RNN) (<xref ref-type="bibr" rid="B19">19</xref>) decompose time into continuous, non-overlapping uniform intervals, known as temporal discretization (<xref ref-type="bibr" rid="B20">20</xref>). This enables the standard models to act on fixed dimensional vectors (regular data). However, this approach lacks the continuity principle and can lead to undesirable results when applied to irregular medical time-series data (<xref ref-type="bibr" rid="B21">21</xref>). Altogether, it is necessary to develop a model that is specifically designed to handle sparse irregular time series data in the real clinical world to achieve real-time accurate predictions at arbitrary time points.</p>
<p>In summary, we aim to help physicians to identify patients at high risk of SIC and sepsis-associated DIC early, especially those who progress to DIC after SIC, as well as improve existing machine learning models to enable arbitrary time-point prediction on real-world irregular data. To achieve this, an interpretable early real-time sequential warning predictor will be developed that contributes to early personalized treatment and reasonable administration. The overview of the study design and model development was shown in <xref ref-type="fig" rid="F1">Figure 1</xref>.</p>
<fig id="F1" position="float">
<label>Figure 1</label>
<caption><p>Study design and model development overview. <bold>(A)</bold> Research application design profile. Study developed an early real-time prediction model to dynamically predict disease progression of sepsis patients after admission to ICU, and to output whether the patient will suffer from SIC and sepsis-associated DIC and the risk score for their onset in future periods. The model feeds into the information obtained from a continuous 24 h sampling time-window and outputs the disease status for the next 8<italic>n</italic> h in real-time. The x-axis indicates the time since admission. <bold>(B)</bold> Model development overview. The research process comprises to data processing, model development, model evaluation, and interpretation. The data processing process includes raw data extraction, outlier processing, coagulation status annotation, and feature engineering. The model development stage included feature set split, sampling time-window selection pre-experimental, model construction, and training. We built eight models, trained and selected the Full model with good performance on the internal validation set by SGD or Adam optimization. The Lite models were developed by selecting easily accessible and important features through SHAP and Occlusion analysis. Models were validated at BIDMC for external validation. The model evaluation and interpretation section include the assessment of model predictive performance, interpretation of model outputs, individualized disease trajectory prediction, etc.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-08-775047-g0001.tif"/>
</fig>
</sec>
<sec sec-type="methods" id="s2">
<title>Methods</title>
<sec>
<title>Study Cohort and Design</title>
<p>This is a multicenter retrospective cohort study. Research data were obtained from two medical centers, the Xi&#x00027;an Jiaotong University Medical College (XJTUMC) and Beth Israel Deaconess Medical Center (BIDMC). Structured query language (SQL) was used to obtain eligible patient data for the period from January 1, 2013 to December 1, 2018 in XJTUMC and from 2001 to 2012 in BIDMC, respectively. The XJTUMC data were obtained from the Center&#x00027;s Biobank and the BIDMC data were obtained from the Medical Information Mark for Intensive Care (MIMIC-III) database (<xref ref-type="bibr" rid="B22">22</xref>). The study was reviewed by the Ethics Committee of the First Affiliated Hospital of Xi&#x00027;an Jiaotong University, and all data were deidentified.</p>
<p>The enrollment process was shown in <xref ref-type="fig" rid="F2">Figure 2</xref>. The inclusion criteria were as follows: (1) sepsis was diagnosed within 24 h of admission based on Sepsis 3.0 criteria; (2) the age was not &#x0003C;18 years; and (3) the duration of hospitalization was not &#x0003C;3 days. The exclusion criteria were as follows: (1) patients with DIC onset within 24 h of admission; (2) patients were affected by hematologic tumors (leukemia, lymphoma, etc.); (3) patients suffering from cirrhosis, acute liver failure, with liver function up to Child C; (4) patients treated with radiotherapy or chemotherapy; (5) patients with admission diagnosis of combat trauma, traumatic coagulopathy; (6) patients with pregnancy or perinatal complications.</p>
<fig id="F2" position="float">
<label>Figure 2</label>
<caption><p>The diagram of study patient enrollment. In XJTUMC, coagulation status annotation was based on SIC and ISTH-overt DIC criteria. In BIDMC, DIC were labeled based on ICD-9. ICD, International Classification of Diseases.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-08-775047-g0002.tif"/>
</fig>
</sec>
<sec>
<title>Data Preprocessing</title>
<p>We initially obtained a total of 174 laboratory features in XJTUMC and 259 laboratory features in BIDMC. Subsequently, we performed the process of merging identical variables (e.g., HGB with different units of g/L or g/dl, HGB in blood count and blood gas test, etc.), eliminating irrelevant variables (e.g., hepatitis antibody quantification, blood drug concentration, etc.), and counting the frequency of variable detection. We removed indictors that were completely missing and detected &#x0003C;1% of indicators at all-time points. In addition, we performed the unit conversions for the XJTUMC laboratory test variables, in order to maintain consistency with BIDMC. Ultimately, under the guidance of the laboratory physicians, we identified 99 features at XJTUMC and 72 features at BIDMC. Of these, the 72 features at BIDMC were common features for both medical centers. The missing information for both medical centers were shown in the <xref ref-type="supplementary-material" rid="SM1">Supplementary Figure 1</xref> (<xref ref-type="supplementary-material" rid="SM1">Supplementary File 1</xref>). And the clinical reportable ranges for each identified variable was shown in <xref ref-type="supplementary-material" rid="SM2">Supplementary File 2</xref>. All variables were initialized by the min-max normalization algorithm.</p>
<p>Clinical sequence data are sparse and irregular, manifested by the presence of a large amount of missing data. Whereas, the pattern of missing data contains important information, such as the correlation between the frequency of a certain marker test and the severity of the disease. Therefore, in this study, we do not deal with missing data. Instead, we use the modeling of missing information to identify the role of missing patterns in prediction, which enhances the model prediction effectiveness. In brief, it is modeled by learning to characterize the missing and hidden information from the time-series data, which is then further introduced into the model network. The multivariate time series <italic>X</italic> &#x0003D; {<italic>x</italic><sub>1</sub>, <italic>x</italic><sub>2</sub>, &#x02026;, <italic>x</italic><sub><italic>T</italic></sub>} is the observations at time <italic>T</italic>. <inline-formula><mml:math id="M1"><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>&#x02208;</mml:mo><mml:msup><mml:mrow><mml:mi>R</mml:mi></mml:mrow><mml:mrow><mml:mi>D</mml:mi></mml:mrow></mml:msup></mml:math></inline-formula>represents the observations at time <italic>t</italic> for all variables. <italic>x</italic><sub><italic>t</italic></sub> contains <italic>D</italic> features <inline-formula><mml:math id="M2"><mml:mrow><mml:mo>{</mml:mo><mml:mrow><mml:msubsup><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msubsup><mml:mo>,</mml:mo><mml:msubsup><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msubsup><mml:mo>,</mml:mo><mml:msubsup><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mrow><mml:mi>D</mml:mi></mml:mrow></mml:msubsup></mml:mrow><mml:mo>}</mml:mo></mml:mrow></mml:math></inline-formula> and <inline-formula><mml:math id="M3"><mml:msubsup><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mrow><mml:mi>d</mml:mi></mml:mrow></mml:msubsup></mml:math></inline-formula> represents the <italic>d</italic>-th feature variable of <italic>x</italic><sub><italic>t</italic></sub>. <italic>s</italic><sub><italic>t</italic></sub> denotes the timestamp of observation <italic>x</italic><sub><italic>t</italic></sub>. We assume that the timestamp of the first observation is 0 (<italic>s</italic><sub><italic>t</italic></sub> = 0), the time interval between different timestamps may be the same or different. &#x00394; indicates adjacent time steps for each variable. To provide an efficient representation of the missing values, we introduce the mask vector <inline-formula><mml:math id="M4"><mml:msubsup><mml:mrow><mml:mi>m</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mrow><mml:mi>d</mml:mi></mml:mrow></mml:msubsup><mml:mo>=</mml:mo><mml:mrow><mml:mo>{</mml:mo><mml:mrow><mml:mn>0</mml:mn><mml:mo>,</mml:mo><mml:mtext>&#x000A0;</mml:mtext><mml:mn>1</mml:mn></mml:mrow><mml:mo>}</mml:mo></mml:mrow></mml:math></inline-formula> to represent the missing variables in <italic>x</italic><sub><italic>t</italic></sub> at time <italic>t</italic>. Some features are missing continuously over a period of time, and <inline-formula><mml:math id="M5"><mml:msubsup><mml:mrow><mml:mi>&#x003B4;</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mrow><mml:mi>d</mml:mi></mml:mrow></mml:msubsup></mml:math></inline-formula> is defined to represent the time interval between the last observation and the current timestamp. To be more specific, we have:</p>
<disp-formula id="E1"><label>(1)</label><mml:math id="M6"><mml:mrow><mml:msubsup><mml:mi>m</mml:mi><mml:mi>t</mml:mi><mml:mi>d</mml:mi></mml:msubsup><mml:mtext>&#x000A0;</mml:mtext><mml:mo>=</mml:mo><mml:mrow><mml:mo>{</mml:mo><mml:mrow><mml:mtable><mml:mtr><mml:mtd><mml:mrow><mml:mn>1</mml:mn><mml:mo>,</mml:mo></mml:mrow></mml:mtd><mml:mtd><mml:mrow><mml:mi>i</mml:mi><mml:mi>f</mml:mi><mml:mtext>&#x000A0;</mml:mtext><mml:msubsup><mml:mi>x</mml:mi><mml:mi>t</mml:mi><mml:mi>d</mml:mi></mml:msubsup><mml:mtext>&#x000A0;</mml:mtext><mml:mi>i</mml:mi><mml:mi>s</mml:mi><mml:mtext>&#x000A0;</mml:mtext><mml:mi>o</mml:mi><mml:mi>b</mml:mi><mml:mi>s</mml:mi><mml:mi>e</mml:mi><mml:mi>r</mml:mi><mml:mi>v</mml:mi><mml:mi>e</mml:mi><mml:mi>d</mml:mi></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:mrow><mml:mn>0</mml:mn><mml:mo>,</mml:mo></mml:mrow></mml:mtd><mml:mtd><mml:mrow><mml:mi>o</mml:mi><mml:mi>t</mml:mi><mml:mi>h</mml:mi><mml:mi>e</mml:mi><mml:mi>r</mml:mi><mml:mi>w</mml:mi><mml:mi>i</mml:mi><mml:mi>s</mml:mi><mml:mi>e</mml:mi></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:mrow></mml:mrow></mml:mrow></mml:math></disp-formula>
<disp-formula id="E2"><label>(2)</label><mml:math id="M7"><mml:mrow><mml:msubsup><mml:mi>&#x003B4;</mml:mi><mml:mi>t</mml:mi><mml:mi>d</mml:mi></mml:msubsup><mml:mtext>&#x000A0;</mml:mtext><mml:mo>=</mml:mo><mml:mrow><mml:mo>{</mml:mo><mml:mrow><mml:mtable><mml:mtr><mml:mtd><mml:mrow><mml:msub><mml:mi>s</mml:mi><mml:mi>t</mml:mi></mml:msub><mml:mo>&#x02212;</mml:mo><mml:msub><mml:mi>s</mml:mi><mml:mrow><mml:mi>t</mml:mi><mml:mo>&#x02212;</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:msubsup><mml:mi>&#x003B4;</mml:mi><mml:mrow><mml:mi>t</mml:mi><mml:mo>&#x02212;</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>d</mml:mi></mml:msubsup></mml:mrow></mml:mtd><mml:mtd><mml:mrow><mml:mi>t</mml:mi><mml:mo>&#x0003E;</mml:mo><mml:mn>1</mml:mn><mml:mo>,</mml:mo><mml:mtext>&#x000A0;</mml:mtext><mml:msubsup><mml:mi>m</mml:mi><mml:mrow><mml:mi>t</mml:mi><mml:mo>&#x02212;</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>d</mml:mi></mml:msubsup><mml:mo>=</mml:mo><mml:mn>0</mml:mn></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:mrow><mml:msub><mml:mi>s</mml:mi><mml:mi>t</mml:mi></mml:msub><mml:mo>&#x02212;</mml:mo><mml:msub><mml:mi>s</mml:mi><mml:mrow><mml:mi>t</mml:mi><mml:mo>&#x02212;</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:msub></mml:mrow></mml:mtd><mml:mtd><mml:mrow><mml:mi>t</mml:mi><mml:mo>&#x0003E;</mml:mo><mml:mn>1</mml:mn><mml:mo>,</mml:mo><mml:mtext>&#x000A0;</mml:mtext><mml:msubsup><mml:mi>m</mml:mi><mml:mrow><mml:mi>t</mml:mi><mml:mo>&#x02212;</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>d</mml:mi></mml:msubsup><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:mn>0</mml:mn></mml:mtd><mml:mtd><mml:mrow><mml:mi>t</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:mtd></mml:mtr></mml:mtable></mml:mrow></mml:mrow></mml:mrow></mml:math></disp-formula>
<p>Thus, a dynamic feature of the input would be represented as <inline-formula><mml:math id="M8"><mml:msub><mml:mrow><mml:mi>X</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:mrow><mml:msubsup><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mrow><mml:mi>d</mml:mi></mml:mrow></mml:msubsup><mml:mo>,</mml:mo><mml:msubsup><mml:mrow><mml:mi>m</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mrow><mml:mi>d</mml:mi></mml:mrow></mml:msubsup><mml:mo>,</mml:mo><mml:mi>&#x00394;</mml:mi><mml:mo>,</mml:mo><mml:msubsup><mml:mrow><mml:mi>&#x003B4;</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi></mml:mrow><mml:mrow><mml:mi>d</mml:mi></mml:mrow></mml:msubsup></mml:mrow><mml:mo stretchy="false">)</mml:mo></mml:mrow></mml:math></inline-formula>. In the later section, the missing information will be introduced into the model for subsequent processing when improving the algorithm model.</p>
</sec>
<sec>
<title>Ground-Truth Labels Using ISTH</title>
<p>We defined all three disease states according to SIC and ISTH overt-DIC criteria. The details of the disease status annotation criteria can be found in <xref ref-type="supplementary-material" rid="SM1">Supplementary Table 1</xref> (<xref ref-type="supplementary-material" rid="SM1">Supplementary File 1</xref>). New data were not available for all 8 h time-window of the day because the patient&#x00027;s laboratory tests were irregular. If there are no updated data available for labeling in an 8 h time-window, then the forward interpolation method is used for labeling based on the labels before and after that time-window. More specific details were shown in <xref ref-type="supplementary-material" rid="SM2">Supplementary Figure 2</xref> (<xref ref-type="supplementary-material" rid="SM1">Supplementary File 1</xref>).</p>
</sec>
<sec>
<title>Continuous Models for Irregular Time Series</title>
<p>The study compared two methods for dealing with irregular time series. The first is the temporal discretization approach, in which the standard RNN model is a typical model. In the second approach, we tackle the irregular time-series problem by modeling the missing information. Based on the standard RNN model, we introduced a decay mechanism for modeling missing information by referencing Che et al.&#x00027;s study (<xref ref-type="bibr" rid="B21">21</xref>), to eventually develop the RNN-Decay model. In addition, we developed the Ordinary Differential Equations-Recurrent Neural Networks (ODE-RNN) model by directly modeling the unequally spaced raw data referring to the work of Yulia et al. (<xref ref-type="bibr" rid="B23">23</xref>). The model architecture diagrams were shown in <xref ref-type="fig" rid="F3">Figure 3</xref>. The model inputs are derived from the extraction of missing patterns of time series information from &#x0201C;Data Processing&#x0201D; described in the above section.</p>
<fig id="F3" position="float">
<label>Figure 3</label>
<caption><p>Architecture diagram of different RNN-based models for processing irregular time-series data<bold>. (A)</bold> Diagram of the standard RNN model processing irregular time-series data. The standard RNN transmits the hidden layer information forward at a fixed time interval without processing the hidden layer information; <bold>(B)</bold> Diagram of RNN-Decay model processing irregular time-series data. Based on the RNN framework, RNN-decay adds temporal decay derived from time intervals to the latent space in order to indirectly process irregular series; however, the longer the time interval, the weaker the information conveyed. <bold>(C)</bold> Diagram of ODE-RNN model processing irregular time-series data. The ODE-RNN directly modeled the unequally spaced raw data, and propagated a latent variable along the time interval using the Neural ODE to solve the latent layer information that corresponds to the irregular timestamp; this allows the arbitrary time-point data to be processed and guarantees temporal continuity. The time series <italic>T</italic> &#x0003D; {<italic>t</italic><sub>0</sub>, <italic>t</italic><sub>1</sub>, &#x02026;, <italic>t</italic><sub><italic>N</italic></sub>} is the observation timestamps, <italic>X</italic> &#x0003D; {<italic>x</italic><sub>0</sub>, <italic>x</italic><sub>1</sub>, &#x02026;, <italic>x</italic><sub><italic>N</italic></sub>} represents the observations at time <italic>t</italic> for all variables, <italic>h</italic>(<italic>t</italic>) is the latent space state corresponding to timestamp <italic>t</italic>. Orange circles indicate an RNN unit. Blue and black dashed lines with arrows indicate the shallow and latent features of the input RNN, and orange dashed lines with arrows indicate data from the previous RNN unit that has been processed in a different way and then fed into the next RNN unit.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-08-775047-g0003.tif"/>
</fig>
</sec>
<sec>
<title>Model Development</title>
<p>To select the appropriate sampling time length, we chose 8, 24, and 48 h sampling time-window to perform pre-experiments. The results were presented in the <xref ref-type="supplementary-material" rid="SM1">Supplementary Table 2</xref> (<xref ref-type="supplementary-material" rid="SM1">Supplementary File 1</xref>). Finally, we set the sampling time-window to 24 h and the sliding time-step to 8 h. Then, we developed several state-of-the-art models that are widely used as follows: (1) Classic machine learning models: Logistic regression (LR) (<xref ref-type="bibr" rid="B24">24</xref>) and support vector machines (SVM) (<xref ref-type="bibr" rid="B25">25</xref>), which are the most commonly used algorithms in existing research; (2) Enhanced machine learning models: gradient boosting machine (LightGBM) (<xref ref-type="bibr" rid="B26">26</xref>) and XGBoost (<xref ref-type="bibr" rid="B27">27</xref>), which are widely regarded as the best algorithm for data prediction and are adopted by many competition winning models in the field of machine learning; (3) Classic deep learning models: RNN (<xref ref-type="bibr" rid="B21">21</xref>) and long short-term memory network (LSTM) (<xref ref-type="bibr" rid="B28">28</xref>), which are the most commonly chosen deep learning models in time-series data, which have shown excellent performance in several time series studies; (4) Improved deep learning models: RNN-Decay and ODE-RNN. The detailed method was described in <xref ref-type="supplementary-material" rid="SM1">Supplementary File 1</xref>. After evaluating the performance, we finally chose the highest-performing XGBoost model as our predictor.</p>
</sec>
<sec>
<title>Model Evaluation</title>
<p>We random divided the XJTUMC data into a train set (70%), a valid set (10%), and a test set (20%). The BIDMC data ware used as the external validation set to evaluate generalization ability of the model. Parameter optimization were performed by Stochastic Gradient Descent (SGD) or the Adam algorithm. The area under the receiver operating characteristic curve (AUROC), the area under the precision-recall curve (AUPRC) and the F1-score were used as model evaluation metrics. Test samples were resampled 1,000 times using bootstrapping to calculate 95% confidence intervals.</p>
</sec>
<sec>
<title>Model Interpretation</title>
<p>In this study, we interpreted the machine learning model results using the Shapley Additive exPlanations (SHAP) algorithm (<xref ref-type="bibr" rid="B29">29</xref>) and the deep learning model results using Occlusion analysis (<xref ref-type="bibr" rid="B30">30</xref>).</p>
</sec>
<sec>
<title>Statistical Analysis</title>
<p>Baseline data are skewed and expressed as the median and interquartile range (IQR). Non-parametric tests were used for statistical tests. <italic>P</italic>-values &#x0003C; 0.001 were considered statistically significant. Navicat Premium (12.1.22), Pytorch (1.7.0), and Python (3.7.6) with Numpy (1.18.5), Pandas (1.1.5), and Scikit-learn (0.23.2) formed the data-processing pipeline. All computational analyses were performed in the Computer Center of the School of Mathematics, Xi&#x00027;an Jiaotong University.</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>Results</title>
<sec>
<title>Study Baseline</title>
<p>A total of 9,717 infection patients in XJTUMC and 15,059 sepsis patients in BIDMC were initially included when applying ICD-9 codes and sepsis 3.0 criteria. After applying the exclusion criteria, 3,809 and 11, 926 patients were left. We then annotated the coagulation status of 3,809 XJTUMC sepsis patients by SIC and ISTH overt-DIC criteria, a total of 12,154 SIC status labels (positive: 8,909; negative: 3,246); and 7,878 overt-DIC status labels (positive: 3,051; negative: 4,827); were available in XJTUMC. Also, we selected 296 patients (1,210 status labels) who developed DIC during hospitalization at the BIDMC center using ICD-9 codes. The baseline characteristics of included patients at XJTUMC and BIDMC were shown in <xref ref-type="table" rid="T1">Table 1</xref>. For both XJTUMC and BIDMC, the median age of sepsis patients is above 60 years and the predominant cause of sepsis was respiratory system-derived infections. Also, 652/1,415 (46.1%) of SIC patients developed to DIC, while 652/679 (96%) of DIC patients fulfilled the SIC diagnosis.</p>
<table-wrap position="float" id="T1">
<label>Table 1</label>
<caption><p>Baseline characteristics of included patients at XJTUMC and BIDMC.</p></caption>
<table frame="hsides" rules="groups">
<thead><tr>
<th/>
<th valign="top" align="center"><bold>XJTUMC (<italic>n</italic> &#x0003D; 3,809)</bold></th>
<th valign="top" align="center"><bold>BIDMC (<italic>n</italic> &#x0003D; 11,926)</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left" colspan="3">Demographic</td>
</tr>
<tr>
<td valign="top" align="left">&#x000A0;&#x000A0;Age (year), median [Q1, Q3]</td>
<td valign="top" align="center">63 [52,72]</td>
<td valign="top" align="center">69 [57,80]</td>
</tr>
<tr>
<td valign="top" align="left">&#x000A0;&#x000A0;Male, <italic>n</italic> (%)</td>
<td valign="top" align="center">2,388 (62.7)</td>
<td valign="top" align="center">6,481 (54.3)</td>
</tr>
<tr>
<td valign="top" align="left" colspan="3">Severity status at admission</td>
</tr>
<tr>
<td valign="top" align="left">&#x000A0;&#x000A0;SOFA score, median [Q1, Q3]</td>
<td valign="top" align="center">3 [3, 4]</td>
<td valign="top" align="center">4 [5, 8]</td>
</tr>
<tr>
<td valign="top" align="left" colspan="3">Infection sources in sepsis, <italic>n</italic> (%)</td>
</tr>
<tr>
<td valign="top" align="left">&#x000A0;&#x000A0;Respiratory system</td>
<td valign="top" align="center">1,702 (44.7)</td>
<td valign="top" align="center">4,957 (41.6)</td>
</tr>
<tr>
<td valign="top" align="left">&#x000A0;&#x000A0;Gastrointestinal system</td>
<td valign="top" align="center">1,435 (37.7)</td>
<td valign="top" align="center">3,194 (26.8)</td>
</tr>
<tr>
<td valign="top" align="left">&#x000A0;&#x000A0;Urinary system</td>
<td valign="top" align="center">5 (0.1)</td>
<td valign="top" align="center">382 (3.2)</td>
</tr>
<tr>
<td valign="top" align="left">&#x000A0;&#x000A0;Cardiac bloodstream system</td>
<td valign="top" align="center">24 (0.6)</td>
<td valign="top" align="center">728 (6.1)</td>
</tr>
<tr>
<td valign="top" align="left">&#x000A0;&#x000A0;Oncology cachexia related</td>
<td valign="top" align="center">567 (14.9)</td>
<td valign="top" align="center">1,077 (9.0)</td>
</tr>
<tr>
<td valign="top" align="left">&#x000A0;&#x000A0;Other</td>
<td valign="top" align="center">76 (2.0)</td>
<td valign="top" align="center">1,588 (13.3)</td>
</tr>
<tr>
<td valign="top" align="left" colspan="3">Outcome, median [Q1, Q3]</td>
</tr>
<tr>
<td valign="top" align="left">&#x000A0;&#x000A0;Hospital stay (day)</td>
<td valign="top" align="center">7 [10, 15]</td>
<td valign="top" align="center">13 [7, 23]</td>
</tr>
<tr>
<td valign="top" align="left" colspan="3">Coagulation status</td>
</tr>
<tr>
<td valign="top" align="left">&#x000A0;&#x000A0;SIC onset, <italic>n</italic> (%)</td>
<td valign="top" align="center">1,415 (37.1)<xref ref-type="table-fn" rid="TN1"><sup>a</sup></xref></td>
<td valign="top" align="center">Unknown</td>
</tr>
<tr>
<td valign="top" align="left">&#x000A0;&#x000A0;DIC onset, <italic>n</italic> (%)</td>
<td valign="top" align="center">679 (17.8)<xref ref-type="table-fn" rid="TN1"><sup>a</sup></xref></td>
<td valign="top" align="center">296 (2.5)<xref ref-type="table-fn" rid="TN2"><sup>b</sup></xref></td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p><italic>For infection sources in sepsis, respiratory system infections mainly cover the lung, trachea, bronchus, and chest related diseases; gastrointestinal system infections typically involve the esophageal, gastric, bowel, liver, spleen, and abdominal related disorders; urinary system infections include renal, ureteral, bladder, and urethra inflammatory diseases; cardiac bloodstream system comprise the cardiac, vascular, vascular catheter, and systemic infection related diseases; oncology cachexia is a variety of malignant diseases and cachectic manifestations; other infections consist of various inflammatory states of unknown etiology and brain diseases.</italic></p>
<fn id="TN1">
<label>a</label>
<p><italic>Diagnosis based on SIC and ISTH-overt DIC criteria for coagulation status annotation.</italic></p></fn>
<fn id="TN2">
<label>b</label>
<p><italic>DIC diagnosis based on International Classification of Diseases-9th edition (ICD9) codes (ICD9 diagnosis code for DIC is 2866)</italic>.</p></fn>
</table-wrap-foot>
</table-wrap>
</sec>
<sec>
<title>Full Model Performance</title>
<p>The predictive performance of eight different models for early DIC onset were shown in <xref ref-type="fig" rid="F4">Figure 4</xref>. <xref ref-type="fig" rid="F4">Figures 4A,B</xref> showed that XGBoost produced the best prediction performance (AUROC: 0.955; AUPRC: 0.939) and was validated in LightGBM, followed by ODE-RNN (AUROC: 0.936; AUPRC: 0.902). However, ODE-RNN ensures continuity of model prediction, which is more suitable for clinical applications than XGBoost. <xref ref-type="fig" rid="F4">Figure 4C</xref> revealed that the performance of the XGBoost on the BIDMC external validation set has decreased (AUROC: 0.865). <xref ref-type="fig" rid="F4">Figure 4D</xref> provided prediction performance of the model at different prediction time-window, revealing that our model could detect the event as early as 48 h before the ground-truth. <xref ref-type="fig" rid="F5">Figure 5</xref> illustrated the prediction performance for SIC, showing similar results to DIC. <xref ref-type="fig" rid="F5">Figures 5A,B</xref> showed that XGBoost provided the best prediction performance (AUROC: 0.973; AUPRC: 0.979). <xref ref-type="fig" rid="F5">Figure 5C</xref> revealed that the performance of the XGBoost on the BIDMC external validation set has decreased (AUROC: 0.973). <xref ref-type="fig" rid="F5">Figure 5D</xref> revealed that XGBoost could detect the event as early as 48 h before the ground-truth with AUROC reached 0.929. The detailed predictive performance of models at different prediction time-window was shown in <xref ref-type="table" rid="T2">Table 2</xref>. The model prediction performance decreases steadily as the prediction time-window extends. The XGBoost and ODE-RNN still maintain good prediction performance for SIC and DIC in the 48 h ahead of prediction time-window. Furthermore, we examined the early warning performance of the models on SIC and DIC with different alert thresholds at the 8 h prediction time-window, the results were shown in <xref ref-type="supplementary-material" rid="SM1">Supplementary Tables 3</xref>, <xref ref-type="supplementary-material" rid="SM1">4</xref> (<xref ref-type="supplementary-material" rid="SM1">Supplementary File 1</xref>). That allows clinicians to select different thresholds according to the characteristics of the different stages of disease development and treatment needs.</p>
<fig id="F4" position="float">
<label>Figure 4</label>
<caption><p>Full model performance evaluation. <bold>(A)</bold> Receiver operating characteristic curves of models for DIC prediction on the internal test set. <bold>(B)</bold> Precision-recall curve of candidate models for DIC prediction on the internal test set. <bold>(C)</bold> Receiver operating characteristic curves on the external test set. <bold>(D)</bold> The predictive performance of models at 8, 24, and 48 h ahead of sepsis-associated DIC onset. Precision was defined as the fraction of correctly alerted 8 h before the ground-truth event. Recall was defined as the proportion of any alarms 8 h prior to the ground-truth event. The lighter-colored intervals above and below the ROC and PR curves are 95% confidence intervals.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-08-775047-g0004.tif"/>
</fig>
<fig id="F5" position="float">
<label>Figure 5</label>
<caption><p>Full model performance evaluation for SIC prediction. <bold>(A)</bold> Receiver operating characteristic curves of models for SIC prediction on the internal test set. <bold>(B)</bold> Precision-recall curve of candidate models for SIC prediction on the internal test set. <bold>(C)</bold> Receiver operating characteristic curves on the external test set. <bold>(D)</bold> The predictive performance of models at 8, 24, and 48 h ahead of SIC onset.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-08-775047-g0005.tif"/>
</fig>
<table-wrap position="float" id="T2">
<label>Table 2</label>
<caption><p>Model performance at different prediction time-window for SIC and DIC prediction.</p></caption>
<table frame="hsides" rules="groups">
<thead><tr>
<th valign="top" align="left"><bold>Model-AUROC</bold></th>
<th valign="top" align="center" style="border-bottom: thin solid #000000;" colspan="3"><bold>SIC</bold></th>
<th valign="top" align="center" style="border-bottom: thin solid #000000;" colspan="3"><bold>DIC</bold></th>
</tr>
<tr>
<th valign="top" align="left"><bold>Prediction time-window</bold></th>
<th valign="top" align="center"><bold>8 h</bold></th>
<th valign="top" align="center"><bold>24 h</bold></th>
<th valign="top" align="center"><bold>48 h</bold></th>
<th valign="top" align="center"><bold>8 h</bold></th>
<th valign="top" align="center"><bold>24 h</bold></th>
<th valign="top" align="center"><bold>48 h</bold></th>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">LR</td>
<td valign="top" align="center">0.905</td>
<td valign="top" align="center">0.911</td>
<td valign="top" align="center">0.872</td>
<td valign="top" align="center">0.883</td>
<td valign="top" align="center">0.857</td>
<td valign="top" align="center">0.847</td>
</tr>
<tr>
<td valign="top" align="left">SVM</td>
<td valign="top" align="center">0.858</td>
<td valign="top" align="center">0.870</td>
<td valign="top" align="center">0.813</td>
<td valign="top" align="center">0.843</td>
<td valign="top" align="center">0.818</td>
<td valign="top" align="center">0.809</td>
</tr>
<tr>
<td valign="top" align="left">XGBoost</td>
<td valign="top" align="center">0.973</td>
<td valign="top" align="center">0.960</td>
<td valign="top" align="center">0.929</td>
<td valign="top" align="center">0.955</td>
<td valign="top" align="center">0.918</td>
<td valign="top" align="center">0.910</td>
</tr>
<tr>
<td valign="top" align="left">LightGBM</td>
<td valign="top" align="center">0.970</td>
<td valign="top" align="center">0.926</td>
<td valign="top" align="center">0.884</td>
<td valign="top" align="center">0.953</td>
<td valign="top" align="center">0.870</td>
<td valign="top" align="center">0.855</td>
</tr>
<tr>
<td valign="top" align="left">RNN</td>
<td valign="top" align="center">0.957</td>
<td valign="top" align="center">0.951</td>
<td valign="top" align="center">0.919</td>
<td valign="top" align="center">0.924</td>
<td valign="top" align="center">0.892</td>
<td valign="top" align="center">0.878</td>
</tr>
<tr>
<td valign="top" align="left">LSTM</td>
<td valign="top" align="center">0.961</td>
<td valign="top" align="center">0.953</td>
<td valign="top" align="center">0.914</td>
<td valign="top" align="center">0.928</td>
<td valign="top" align="center">0.899</td>
<td valign="top" align="center">0.881</td>
</tr>
<tr>
<td valign="top" align="left">RNN-decay</td>
<td valign="top" align="center">0.950</td>
<td valign="top" align="center">0.947</td>
<td valign="top" align="center">0.915</td>
<td valign="top" align="center">0.927</td>
<td valign="top" align="center">0.893</td>
<td valign="top" align="center">0.884</td>
</tr>
<tr>
<td valign="top" align="left">ODE-RNN</td>
<td valign="top" align="center">0.962</td>
<td valign="top" align="center">0.951</td>
<td valign="top" align="center">0.914</td>
<td valign="top" align="center">0.936</td>
<td valign="top" align="center">0.904</td>
<td valign="top" align="center">0.883</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<p><italic>SIC, sepsis-induced coagulopathy; DIC, disseminated intravascular coagulation; LR, logistic regression; SVM, support vector machines; LightGBM, light gradient boosting machine; XGBoost, eXtreme gradient boosting; RNN, recurrent neural network; LSTM, long short-term memory network; RNN-decay, recurrent neural networks-decay; ODE-RNN, ordinary differential equations-recurrent neural networks</italic>.</p>
</table-wrap-foot>
</table-wrap>
</sec>
<sec>
<title>Model Interpretation</title>
<p>To understand the contribution of the features to the model predictions, we interpreted the XGBoost predictions using Shapley values, which were presented in <xref ref-type="fig" rid="F6">Figure 6</xref>. <xref ref-type="fig" rid="F6">Figure 6A</xref> showed the top 20 features that contribute most to the model output; <xref ref-type="fig" rid="F6">Figure 6B</xref> showed the impact of the top 20 features on all samples in the model. Shaply analysis identified that the most valuable features for DIC prediction were platelet (PLT), D-dimer, International normalized ratio (INR), plateletcrit (PCT), fibrinogen (FIB), fibrin degradation products (FDP). We further developed dependency plots to capture the non-linear correlation between a single significant feature and the predicted risk. As an example, <xref ref-type="fig" rid="F6">Figure 6C</xref> showed that when PLT was below 80, the shape-value was significantly increased with higher predicted risk. <xref ref-type="fig" rid="F6">Figure 6D</xref> showed the interaction between PLT and PCT, where when PCT is low, the corresponding PLT feature value is low, SHAP takes a high value and the model output risk increases. In addition, the SHAP force plot provides insight into the output risk and decision factors for specific samples. In the case of <xref ref-type="fig" rid="F6">Figure 6E</xref>, the model predicts the sample at a high risk of a DIC event based on PT, INR, and PLT.</p>
<fig id="F6" position="float">
<label>Figure 6</label>
<caption><p>SHAP-based interpretation of model. <bold>(A)</bold> Overall feature importance of the top 20 features. <bold>(B)</bold> Beeswarm plot showing the impact of the top 20 features across all samples in the model. Beeswarm combines feature importance and feature effect, ranking the features by the sum of the SHAP over all samples (y-axis). In the plot, one row represents one feature and each dot represents the feature SHapley value for one sample, gray dots represent missing values, colors represent feature values (red high, blue low). Long tails indicate that features are extremely important for a particular patient. The x-axis represents the impact on the model output, with positive values pushing risk higher and negative values driving risk lower. <bold>(C)</bold> SHAP dependence plot showing predicted risk vs. feature value for PLT. The x-axis is the range of eigenvalues of PLT features and the y-axis is the shape-value of PLT features. It showed that when PLT was below 80, the shape-value was significantly increased with higher predicted risk. <bold>(D)</bold> SHAP interaction dependency plot describes the relationship between two interaction features and predicted risk. It showed the interaction between PLT and PCT, where when PCT is low, the corresponding PLT feature value is low, SHAP takes a high value and the model output risk increases. <bold>(E)</bold> SHAP force plot shows an interpretable example of single-sample feature prediction results. The base value is the predicted average of the all sample, and the output value is the predicted value of the current sample. Red indicates that the feature increases the risk, blue indicates that the feature decreases the risk. Longer feature bars indicate that the feature is contributing more.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-08-775047-g0006.tif"/>
</fig>
<p>In addition, we interpreted the deep learning model ODE-RNN using occlusion analysis, as shown in <xref ref-type="supplementary-material" rid="SM3">Supplementary File 3</xref>. Occlusion analysis showed that a global absence of a single feature has small impact on the model output results for the ODE-RNN model. We also performed univariate and multivariate analyses of baseline data on the first day for different coagulation status groups, as detailed in <xref ref-type="supplementary-material" rid="SM1">Supplementary Tables 5</xref>, <xref ref-type="supplementary-material" rid="SM1">6</xref> (<xref ref-type="supplementary-material" rid="SM1">Supplementary File 1</xref>), suggesting the reliability of the machine learning approach.</p>
<p><xref ref-type="fig" rid="F7">Figure 7</xref> showed an example of real-time sequential prediction using our model on one patient. At each time point after the patient admission over 24 h, the model provides a real-time risk and uncertainty assessment of the future SIC and sepsis-associated DIC onset. This showed that the model could detect SIC and sepsis-associated DIC 48 h early, which is important for clinicians to take precautionary approaches ahead of the event.</p>
<fig id="F7" position="float">
<label>Figure 7</label>
<caption><p>An interpretable real-time risk forecasting example. A 69-year-old male patient was hospitalized with the diagnosis of &#x0201C;Acute biliary pancreatitis, Obstructive jaundice.&#x0201D; The patient was diagnosed with SIC on the third day and sepsis-associated DIC on the fifth day of admission by the clinician. Our model predicted the disease progression earlier than the clinician. The predictions revealed that the most of sepsis-associated DIC events could be accurately predicted up to 8 h earlier. However, there were some sepsis-associated DIC events were still not predicted, mainly in the persistence of DIC onset, which might be related to clinical medicine interventions. The bottom of the graph is the SIC risk score and the upper is the DIC risk score. Red circles indicate sepsis-associated DIC events evaluated by the model. Red stars indicate true future predictions (meeting the ISTH overt-DIC criteria).</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-08-775047-g0007.tif"/>
</fig>
</sec>
<sec>
<title>Lite Model Development</title>
<p>To enhance the transferability and reduce the data requirements of the model, we selected the ten most influential features based on SHAP values, Occlusion analysis, and clinical practicability (The Lite model feature details were shown in <xref ref-type="supplementary-material" rid="SM2">Supplementary File 2</xref>). Based on the selected features, we constructed the Lite model. <xref ref-type="fig" rid="F8">Figure 8</xref> indicated that the XGBoost-based Lite model achieves the best performance of predicting DIC 8 h in advance, but the model performance is slightly lower than that of the Full model (AUROC: 0.916 vs. 0.955).</p>
<fig id="F8" position="float">
<label>Figure 8</label>
<caption><p>Lite model performance evaluation. <bold>(A)</bold> Receiver operating characteristic curves of XGBoost for DIC. <bold>(B)</bold> Receiver operating characteristic curves of ODE-RNN for DIC.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fmed-08-775047-g0008.tif"/>
</fig>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<title>Discussion</title>
<p>In this study, we developed two models enabling real-time sequential monitoring of SIC and DIC disease progression in sepsis. The model could identify high-risk patients 48 h before the clinical diagnosis of SIC and sepsis-associated DIC, achieving the state-of-the-art retrospective performance. The full XGBoost model currently achieved the highest prediction performance (SIC: 0.973; DIC: 0.955). The Lite XGBoost model also achieved pleasing prediction performance (DIC: 0.916). On the BIDMC test set, the model performance decreased slightly (DIC: 0.865). In the 8 h prediction time-window with a threshold of 0.7, the XGBoost model was able to predict 89.5% of SIC and 83.1% of sepsis-associated DIC events correctly. Meanwhile, our study has introduced a methodological improvement. Specifically, our study provided the following contributions: (1) We developed and validated the first model for earlier sequential dynamic monitoring of sepsis-induced coagulation disease progression; (2) We processed irregular time-series data for the first time in dynamic prediction research using ODE method, achieving predictions at arbitrary time points; (3) We provided the visual interpretation for deep learning models and machine learning models, respectively, which improved the recognition of physicians toward complex models.</p>
<p>Sepsis-induced SIC, particularly sepsis-associated DIC, is a major cause of increased mortality in sepsis. However, clinical DIC diagnosis relies on FIB and D-Dimer whose laboratory testing frequency is &#x0003C;10% (<xref ref-type="bibr" rid="B31">31</xref>), resulting in a lag in DIC diagnosis. Therefore, it is meaningful to use a full spectrum of laboratory tests for the early detection of coagulation disorders. To our knowledge, there is only one study using machine learning to predict the progression of sepsis-induced DIC that was published in 2020 (<xref ref-type="bibr" rid="B32">32</xref>). Hasegawa et al. performed three classical machine learning methods to predict the progression of sepsis-induced coagulation disorders. In that study, sepsis was defined based on Systemic Inflammatory Response Syndrome (SIRS) criteria rather than sepsis 3.0 criteria. In addition, the study used the static data and the accuracy of the model to predict the progression of coagulopathy was only 59.8&#x02013;67.0% (<xref ref-type="bibr" rid="B32">32</xref>). This is far poorer than our model prediction performance, which suggests that dynamic data monitoring is more consistent with clinical application than static models. In our study, high-risk patients were identified up to 48 h earlier, which suggests that comprehensive use of laboratory tests could detect coagulation disorders earlier. The Lite model also achieves satisfactory predictive performance.</p>
<p>The irregularity of clinical time series data was reflected in the tables as a large number of missing. Previous studies deal with large amounts of missing data by removing missing variables or using statistical interpolation methods, but such methods are not applicable to time series data (<xref ref-type="bibr" rid="B33">33</xref>). Neural ODE is a continuous dynamics theory that can explore the dynamic interactions between key features in the timeline of event onset and development (<xref ref-type="bibr" rid="B34">34</xref>). Our results demonstrate the superiority of ODE in the dynamics of disease. In a recent review, Alber et al. showed that it remains a challenge to apply ODE in medical continuous monitoring studies with incomplete baseline data and low-sampling data (<xref ref-type="bibr" rid="B35">35</xref>). Our study introduced ODE into RNNs and achieved better performance than RNN and LSTM, showing that ODE-RNNs are more appropriate for sparse irregular data than standard deep learning models. However, our results showed that the performance of the ODE-RNN was lower than that of the gradient boosted tree model (XGBoost and LightGBM). We consider that clinical laboratory diagnoses usually use hierarchical stratification for diagnosis, which fits better with the splitting structure of the tree model and gives the tree model a natural advantage. In addition, Qin et al. showed that neural models are not good at efficient feature transformation and scaling, while the tree-based model has an advantage in this respect (<xref ref-type="bibr" rid="B36">36</xref>). However, the flexibility and variety of tasks that can be achieved with deep learning are not available with traditional methods when dealing with complex tabular problems. Furthermore, occlusion analysis showed that a single feature masking does not affect the model significantly, indicating that ODE-RNN has better perturbation resistance. That is, the overall absence of a particular examination does not have a large impact on the ODE-RNN model, suggesting that the ODE-RNN model may have better robustness. Finally, the arbitrary time point continuous prediction achieved by ODE-RNN is also not possible with the gradient boosted tree model, where this arbitrary time point continuity is significant for clinical applications.</p>
<p>Our study offers the following potential benefits: Firstly, it is essential for ICU clinicians and nurses to identify patients who truly need intensive attention and personalized preventive medication. Our predictor can reduce the alarm frequency in patients without a high risk of sepsis-associated DIC occurrence after SIC. Secondly, our ODE-RNN model provides a reference for model selection of real-world irregular time series processing. This will facilitate subsequent studies to build robust models that better match the characteristics of clinical data. Thirdly, our model can be used to identify sepsis patients in different states of coagulation impairment, which could be useful for future randomized controlled clinical studies and further assist physicians to evaluate the time window of anticoagulation therapy appropriately. Finally, our interpretable model provides a visual interactive operating system prototype for early warning systems in ICU and will facilitate clinical deployment of predictive models.</p>
<p>However, some limitations also exist in our study. First of all, our model was developed in a single center, which reduces the effectiveness and may require retraining when the model is migrated to other centers. Furthermore, because we failed to obtain bedside real-time vital sign monitoring data, our model did not incorporate these parameters which may diminish the efficacy of the model. Finally, our study is retrospective and further prospective clinical studies need to be validated.</p>
</sec>
<sec sec-type="conclusions" id="s5">
<title>Conclusion</title>
<p>Our early dynamic sequential predictor enables identification of sepsis patients at high risk of SIC and DIC up to 48 h earlier, achieving the highest performance to date. Our study showed that the ODE-RNN model achieves better performance than the standard RNN model. Our study contributes to early personalized management, and also improves the currently available algorithms.</p>
</sec>
<sec sec-type="data-availability" id="s6">
<title>Data Availability Statement</title>
<p>The raw data supporting the conclusions of this article will be made available by the authors, without undue reservation.</p>
</sec>
<sec id="s7">
<title>Ethics Statement</title>
<p>The studies involving human participants were reviewed and approved by XJTU1AF2020LSL-003. Written informed consent for participation was not required for this study in accordance with the national legislation and the institutional requirements.</p>
</sec>
<sec id="s8">
<title>Author Contributions</title>
<p>RC designed the experiments, provided and preprocessed the clinical data, developed the supervised learning pipelines, and drafted the manuscript. WH designed the experiments, developed the machine learning pipelines, constructed the deep learning pipelines, and drafted the manuscript. KQ preprocessed the data and carried out the multivariate regression analysis. HY annotated the disease status labels and developed the deep learning pipelines. YT, QL, and HW carried out the data filtering and univariate analysis. YM, SL, and TL defined the clinically reportable range and performed multivariate regression analysis. JZ, JS, and CL revised the manuscript, conceived, and directed the project. All authors read and approved the final manuscript.</p>
</sec>
<sec sec-type="funding-information" id="s9">
<title>Funding</title>
<p>This study was supported by the Critical Clinical Research Project of the First Affiliated Hospital of Xi&#x00027;an Jiaotong University (No. XJTU1AF-CRF-2020-003) and the Joint Project of Universities in Shaanxi Province - Key Project (No. 2021GXLH-Z-099).</p>
</sec>
<sec sec-type="COI-statement" id="conf1">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s10">
<title>Publisher&#x00027;s Note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
</body>
<back>
<ack><p>We gratefully acknowledge the data support from the Biobank of First Affiliated Hospital of Xi&#x00027;an Jiaotong University, and the MIMIC project from Massachusetts Institute of Technology and the Beth Israel Deaconess Medical Center. We also thank the helpful discussions with Yan Yang, Ph.D., and Dong Yang, Ph.D., School of Mathematics and Statistics, Xi&#x00027;an Jiaotong University. We thank the technician Hui Liu who performed the data quality control, Biobank, the First Affiliated Hospital of Xi&#x00027;an Jiaotong University. Finally, thanks to all reviewers for their time and suggestions.</p>
</ack><sec sec-type="supplementary-material" id="s11">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fmed.2021.775047/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fmed.2021.775047/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Data_Sheet_1.docx" id="SM1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Data_Sheet_2.DOCX" id="SM2" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Data_Sheet_3.DOCX" id="SM3" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/></sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Coopersmith</surname> <given-names>CM</given-names></name> <name><surname>De Backer</surname> <given-names>D</given-names></name> <name><surname>Deutschman</surname> <given-names>CS</given-names></name> <name><surname>Ferrer</surname> <given-names>R</given-names></name> <name><surname>Lat</surname> <given-names>I</given-names></name> <name><surname>Machado</surname> <given-names>FR</given-names></name> <etal/></person-group>. <article-title>Surviving sepsis campaign: research priorities for sepsis and septic shock</article-title>. <source>Intensive Care Med.</source> (<year>2018</year>) <volume>44</volume>:<fpage>1400</fpage>&#x02013;<lpage>26</lpage>. <pub-id pub-id-type="doi">10.1007/s00134-018-5175-z</pub-id><pub-id pub-id-type="pmid">29971592</pub-id></citation></ref>
<ref id="B2">
<label>2.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Prescott</surname> <given-names>HC</given-names></name> <name><surname>Angus</surname> <given-names>DC</given-names></name></person-group>. <article-title>Enhancing recovery from sepsis: a review</article-title>. <source>JAMA</source>. (<year>2018</year>) <volume>319</volume>: <fpage>62</fpage>&#x02013;<lpage>75</lpage>. <pub-id pub-id-type="doi">10.1001/jama.2017.17687</pub-id><pub-id pub-id-type="pmid">29297082</pub-id></citation></ref>
<ref id="B3">
<label>3.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Levi</surname> <given-names>M</given-names></name> <name><surname>van der Poll</surname> <given-names>T</given-names></name></person-group>. <article-title>Coagulation and sepsis</article-title>. <source>Thromb Res.</source> (<year>2017</year>) <volume>149</volume>:<fpage>38</fpage>&#x02013;<lpage>44</lpage>. <pub-id pub-id-type="doi">10.1016/j.thromres.2016.11.007</pub-id><pub-id pub-id-type="pmid">27886531</pub-id></citation></ref>
<ref id="B4">
<label>4.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Iba</surname> <given-names>T</given-names></name> <name><surname>Umemura</surname> <given-names>Y</given-names></name> <name><surname>Watanabe</surname> <given-names>E</given-names></name> <name><surname>Wada</surname> <given-names>T</given-names></name> <name><surname>Hayashida</surname> <given-names>K</given-names></name> <name><surname>Kushimoto</surname> <given-names>S</given-names></name> <etal/></person-group>. <article-title>Diagnosis of sepsis-induced disseminated intravascular coagulation and coagulopathy</article-title>. <source>Acute Med Surg.</source> (<year>2019</year>) <volume>6</volume>:<fpage>223</fpage>&#x02013;<lpage>32</lpage>. <pub-id pub-id-type="doi">10.1002/ams2.411</pub-id><pub-id pub-id-type="pmid">31410983</pub-id></citation></ref>
<ref id="B5">
<label>5.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Voves</surname> <given-names>C</given-names></name> <name><surname>Wuillemin</surname> <given-names>WA</given-names></name> <name><surname>Zeerleder</surname> <given-names>S</given-names></name></person-group>. <article-title>International Society on Thrombosis and Haemostasis score for overt disseminated intravascular coagulation predicts organ dysfunction and fatality in sepsis patients</article-title>. <source>Blood Coagul Fibrin.</source> (<year>2006</year>) <volume>17</volume>:<fpage>445</fpage>&#x02013;<lpage>51</lpage>. <pub-id pub-id-type="doi">10.1097/01.mbc.0000240916.63521.2e</pub-id><pub-id pub-id-type="pmid">16905947</pub-id></citation></ref>
<ref id="B6">
<label>6.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lyons</surname> <given-names>PG</given-names></name> <name><surname>Micek</surname> <given-names>ST</given-names></name> <name><surname>Hampton</surname> <given-names>N</given-names></name> <name><surname>Kollef</surname> <given-names>MH</given-names></name></person-group>. <article-title>Sepsis-associated coagulopathy severity predicts hospital mortality</article-title>. <source>Crit Care Med.</source> (<year>2018</year>) <volume>46</volume>:<fpage>736</fpage>&#x02013;<lpage>42</lpage>. <pub-id pub-id-type="doi">10.1097/CCM.0000000000002997</pub-id><pub-id pub-id-type="pmid">29373360</pub-id></citation></ref>
<ref id="B7">
<label>7.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Iba</surname> <given-names>T</given-names></name> <name><surname>Nisio</surname> <given-names>MD</given-names></name> <name><surname>Levy</surname> <given-names>JH</given-names></name> <name><surname>Kitamura</surname> <given-names>N</given-names></name> <name><surname>Thachil</surname> <given-names>J</given-names></name></person-group>. <article-title>New criteria for sepsis-induced coagulopathy (SIC) following the revised sepsis definition: a retrospective analysis of a nationwide survey</article-title>. <source>BMJ Open.</source> (<year>2017</year>) <volume>7</volume>:<fpage>e017046</fpage>. <pub-id pub-id-type="doi">10.1136/bmjopen-2017-017046</pub-id><pub-id pub-id-type="pmid">28963294</pub-id></citation></ref>
<ref id="B8">
<label>8.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Iba</surname> <given-names>T</given-names></name> <name><surname>Arakawa</surname> <given-names>M</given-names></name> <name><surname>Di Nisio</surname> <given-names>M</given-names></name> <name><surname>Gando</surname> <given-names>S</given-names></name> <name><surname>Anan</surname> <given-names>H</given-names></name> <name><surname>Sato</surname> <given-names>K</given-names></name> <etal/></person-group>. <article-title>Newly proposed sepsis-induced coagulopathy precedes international society on thrombosis and haemostasis overt-disseminated intravascular coagulation and predicts high mortality</article-title>. <source>J Intensive Care Med.</source> (<year>2020</year>) <volume>35</volume>:<fpage>643</fpage>&#x02013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1177/0885066618773679</pub-id><pub-id pub-id-type="pmid">29720054</pub-id></citation></ref>
<ref id="B9">
<label>9.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gando</surname> <given-names>S</given-names></name> <name><surname>Levi</surname> <given-names>M</given-names></name> <name><surname>Toh</surname> <given-names>CH</given-names></name></person-group>. <article-title>Disseminated intravascular coagulation</article-title>. <source>Nat Rev Dis Primers.</source> (<year>2016</year>) <volume>2</volume>:<fpage>16037</fpage>. <pub-id pub-id-type="doi">10.1038/nrdp.2016.37</pub-id><pub-id pub-id-type="pmid">27250996</pub-id></citation></ref>
<ref id="B10">
<label>10.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Umemura</surname> <given-names>Y</given-names></name> <name><surname>Yamakawa</surname> <given-names>K</given-names></name> <name><surname>Ogura</surname> <given-names>H</given-names></name> <name><surname>Yuhara</surname> <given-names>H</given-names></name> <name><surname>Fujimi</surname> <given-names>S</given-names></name></person-group>. <article-title>Efficacy and safety of anticoagulant therapy in three specific populations with sepsis: a meta-analysis of randomized controlled trials</article-title>. <source>J Thromb Haemost.</source> (<year>2016</year>) <volume>14</volume>:<fpage>518</fpage>&#x02013;<lpage>30</lpage>. <pub-id pub-id-type="doi">10.1111/jth.13230</pub-id><pub-id pub-id-type="pmid">27537607</pub-id></citation></ref>
<ref id="B11">
<label>11.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Umemura</surname> <given-names>Y</given-names></name> <name><surname>Yamakawa</surname> <given-names>K</given-names></name></person-group>. <article-title>Optimal patient selection for anticoagulant therapy in sepsis: an evidence-based proposal from Japan</article-title>. <source>J Thromb Haemost.</source> (<year>2018</year>) <volume>16</volume>:<fpage>462</fpage>&#x02013;<lpage>4</lpage>. <pub-id pub-id-type="doi">10.1111/jth.13946</pub-id><pub-id pub-id-type="pmid">29316171</pub-id></citation></ref>
<ref id="B12">
<label>12.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Iba</surname> <given-names>T</given-names></name> <name><surname>Levy</surname> <given-names>JH</given-names></name> <name><surname>Warkentin</surname> <given-names>TE</given-names></name> <name><surname>Thachil</surname> <given-names>J</given-names></name> <name><surname>van der Poll</surname> <given-names>T</given-names></name> <name><surname>Levi</surname> <given-names>M</given-names></name></person-group>. <article-title>Diagnosis and management of sepsis-induced coagulopathy and disseminated intravascular coagulation</article-title>. <source>J Thromb Haemost.</source> (<year>2019</year>) <volume>17</volume>:<fpage>1989</fpage>&#x02013;<lpage>94</lpage>. <pub-id pub-id-type="doi">10.1111/jth.14578</pub-id><pub-id pub-id-type="pmid">31410983</pub-id></citation></ref>
<ref id="B13">
<label>13.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ngiam</surname> <given-names>KY</given-names></name> <name><surname>Khor</surname> <given-names>IW</given-names></name></person-group>. <article-title>Big data and machine learning algorithms for health-care delivery</article-title>. <source>Lancet Oncol.</source> (<year>2019</year>) <volume>20</volume>:<fpage>e262</fpage>&#x02013;<lpage>73</lpage>. <pub-id pub-id-type="doi">10.1016/S1470-2045(19)30149-4</pub-id><pub-id pub-id-type="pmid">31044724</pub-id></citation></ref>
<ref id="B14">
<label>14.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jiang</surname> <given-names>F</given-names></name> <name><surname>Jiang</surname> <given-names>Y</given-names></name> <name><surname>Zhi</surname> <given-names>H</given-names></name> <name><surname>Dong</surname> <given-names>Y</given-names></name> <name><surname>Li</surname> <given-names>H</given-names></name> <name><surname>Ma</surname> <given-names>S</given-names></name> <etal/></person-group>. <article-title>Artificial intelligence in healthcare: past, present and future</article-title>. <source>Stroke Vasc Neurol.</source> (<year>2017</year>) <volume>2</volume>:<fpage>230</fpage>&#x02013;<lpage>43</lpage>. <pub-id pub-id-type="doi">10.1136/svn-2017-000101</pub-id><pub-id pub-id-type="pmid">31670713</pub-id></citation></ref>
<ref id="B15">
<label>15.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Harerimana</surname> <given-names>G</given-names></name> <name><surname>Kim</surname> <given-names>JW</given-names></name> <name><surname>Yoo</surname> <given-names>H</given-names></name> <name><surname>Jang</surname> <given-names>B</given-names></name></person-group>. <article-title>Deep learning for electronic health records analytics</article-title>. <source>IEEE Access.</source> (<year>2019</year>) <volume>7</volume>:<fpage>101245</fpage>&#x02013;<lpage>59</lpage>. <pub-id pub-id-type="doi">10.1109/access.2019.2928363</pub-id><pub-id pub-id-type="pmid">33182703</pub-id></citation></ref>
<ref id="B16">
<label>16.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Fleuren</surname> <given-names>LM</given-names></name> <name><surname>Klausch</surname> <given-names>TLT</given-names></name> <name><surname>Zwager</surname> <given-names>CL</given-names></name> <name><surname>Schoonmade</surname> <given-names>LJ</given-names></name> <name><surname>Guo</surname> <given-names>T</given-names></name> <name><surname>Roggeveen</surname> <given-names>LF</given-names></name> <etal/></person-group>. <article-title>Machine learning for the prediction of sepsis: a systematic review and meta-analysis of diagnostic test accuracy</article-title>. <source>Intensive Care Med.</source> (<year>2020</year>) <volume>46</volume>:<fpage>383</fpage>&#x02013;<lpage>400</lpage>. <pub-id pub-id-type="doi">10.1007/s00134-019-05872-y</pub-id><pub-id pub-id-type="pmid">31965266</pub-id></citation></ref>
<ref id="B17">
<label>17.</label>
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Holzinger</surname> <given-names>A</given-names></name> <name><surname>Jurisica</surname> <given-names>I</given-names></name></person-group>. <article-title>Knowledge discovery and data mining in biomedical informatics: the future is in integrative, interactive machine learning solutions</article-title>: In: <person-group person-group-type="editor"><name><surname>Holzinger</surname> <given-names>A</given-names></name> <name><surname>Jurisica</surname> <given-names>I</given-names></name></person-group> editors. <source>Interactive Knowledge Discovery and Data Mining in Biomedical Informatics. Lecture Notes in Computer Science</source>, Vol. <volume>8401</volume>. <publisher-loc>Berlin; Heidelberg</publisher-loc>: <publisher-name>Springer</publisher-name> (<year>2014</year>). p. <fpage>1</fpage>&#x02013;<lpage>18</lpage>. <pub-id pub-id-type="doi">10.1007/978-3-662-43968-5_1</pub-id></citation>
</ref>
<ref id="B18">
<label>18.</label>
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>TQ</given-names></name> <name><surname>Guestrin</surname> <given-names>C</given-names></name> <name><surname>Assoc Comp</surname> <given-names>M</given-names></name></person-group>. <article-title>XGBoost: a scalable tree boosting system</article-title>. In: <source>Kdd&#x00027;16: Proceedings of the 22nd Acm Sigkdd International Conference on Knowledge Discovery and Data Mining</source>. <publisher-loc>San Francisco, CA</publisher-loc> (<year>2016</year>). p. <fpage>785</fpage>&#x02013;<lpage>94</lpage>. <pub-id pub-id-type="doi">10.1145/2939672.2939785</pub-id><pub-id pub-id-type="pmid">32561836</pub-id></citation></ref>
<ref id="B19">
<label>19.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>J</given-names></name> <name><surname>Zhang</surname> <given-names>L</given-names></name> <name><surname>Guo</surname> <given-names>Q</given-names></name> <name><surname>Yi</surname> <given-names>Z</given-names></name></person-group>. <article-title>Recurrent neural networks with auxiliary memory units</article-title>. <source>IEEE Trans Neural Netw Learn Syst.</source> (<year>2017</year>) <volume>29</volume>:<fpage>1652</fpage>&#x02013;<lpage>61</lpage>. <pub-id pub-id-type="doi">10.1109/TNNLS.2017.2677968</pub-id><pub-id pub-id-type="pmid">28333646</pub-id></citation></ref>
<ref id="B20">
<label>20.</label>
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Futoma</surname> <given-names>J</given-names></name> <name><surname>Hariharan</surname> <given-names>S</given-names></name> <name><surname>Heller</surname> <given-names>K</given-names></name></person-group>. <article-title>Learning to detect sepsis with a multitask gaussian process RNN classifier.</article-title> In: <person-group person-group-type="editor"><name><surname>Doina</surname> <given-names>P</given-names></name> <name><surname>Yee Whye</surname> <given-names>T</given-names></name></person-group> editors. <source>Proceedings of the 34th International Conference on Machine Learning.</source> Vol. <volume>70</volume>. <publisher-loc>Proceedings of Machine Learning Research</publisher-loc>: <publisher-name>PMLR. Sydney, NSW</publisher-name> (<year>2017</year>). p. <fpage>1174</fpage>&#x02013;<lpage>82</lpage>.</citation>
</ref>
<ref id="B21">
<label>21.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Che</surname> <given-names>Z</given-names></name> <name><surname>Purushotham</surname> <given-names>S</given-names></name> <name><surname>Cho</surname> <given-names>K</given-names></name> <name><surname>Sontag</surname> <given-names>D</given-names></name> <name><surname>Liu</surname> <given-names>Y</given-names></name></person-group>. <article-title>Recurrent neural networks for multivariate time series with missing values</article-title>. <source>Sci Rep.</source> (<year>2018</year>) <volume>8</volume>:<fpage>6085</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-018-24271-9</pub-id><pub-id pub-id-type="pmid">29666385</pub-id></citation></ref>
<ref id="B22">
<label>22.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Johnson</surname> <given-names>AE</given-names></name> <name><surname>Pollard</surname> <given-names>TJ</given-names></name> <name><surname>Shen</surname> <given-names>L</given-names></name> <name><surname>Lehman</surname> <given-names>LW</given-names></name> <name><surname>Feng</surname> <given-names>M</given-names></name> <name><surname>Ghassemi</surname> <given-names>M</given-names></name> <etal/></person-group>. <article-title>MIMIC-III, a freely accessible critical care database</article-title>. <source>Sci Data.</source> (<year>2016</year>) <volume>3</volume>:<fpage>160035</fpage>. <pub-id pub-id-type="doi">10.1038/sdata.2016.35</pub-id><pub-id pub-id-type="pmid">27219127</pub-id></citation></ref>
<ref id="B23">
<label>23.</label>
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Rubanova</surname> <given-names>Y</given-names></name> <name><surname>Chen</surname> <given-names>RTQ</given-names></name> <name><surname>Duvenaud</surname> <given-names>D</given-names></name></person-group>. <article-title>Latent ODEs for irregularly-sampled time series</article-title>. In: <source>Advances in Neural Information Processing Systems 32 (Nips 2019).</source> Vol. <volume>32</volume>. <publisher-loc>Vancouver, BC</publisher-loc> (<year>2019</year>).</citation>
</ref>
<ref id="B24">
<label>24.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Christensen</surname> <given-names>R</given-names></name></person-group>. <article-title>Linear and log-linear models</article-title>. <source>J Am Stat Assoc.</source> (<year>2000</year>) <volume>95</volume>:<fpage>1290</fpage>&#x02013;<lpage>3</lpage>. <pub-id pub-id-type="doi">10.1080/01621459.2000.10474332</pub-id></citation>
</ref>
<ref id="B25">
<label>25.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Noble</surname> <given-names>WS</given-names></name></person-group>. <article-title>What is a support vector machine?</article-title> <source>Nat Biotechnol.</source> (<year>2006</year>) <volume>24</volume>:<fpage>1565</fpage>&#x02013;<lpage>7</lpage>. <pub-id pub-id-type="doi">10.1038/nbt1206-1565</pub-id><pub-id pub-id-type="pmid">17160063</pub-id></citation></ref>
<ref id="B26">
<label>26.</label>
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Ke</surname> <given-names>GL</given-names></name> <name><surname>Meng</surname> <given-names>Q</given-names></name> <name><surname>Finley</surname> <given-names>T</given-names></name> <name><surname>Wang</surname> <given-names>TF</given-names></name> <name><surname>Chen</surname> <given-names>W</given-names></name> <name><surname>Ma</surname> <given-names>WD</given-names></name> <etal/></person-group>. <article-title>LightGBM: a highly efficient gradient boosting decision tree.</article-title> In: <person-group person-group-type="editor"><name><surname>Guyon</surname> <given-names>I</given-names></name> <name><surname>Luxburg</surname> <given-names>UV</given-names></name> <name><surname>Bengio</surname> <given-names>S</given-names></name> <name><surname>Wallach</surname> <given-names>H</given-names></name> <name><surname>Fergus</surname> <given-names>R</given-names></name> <name><surname>Vishwanathan</surname> <given-names>S</given-names></name> <name><surname>Garnett</surname> <given-names>R</given-names></name></person-group>. <source>Advances in Neural Information Processing Systems 30,</source> Vol. <volume>30</volume>. <publisher-loc>Long Beach, CA</publisher-loc> (<year>2017</year>).</citation>
</ref>
<ref id="B27">
<label>27.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sagi</surname> <given-names>O</given-names></name> <name><surname>Rokach</surname> <given-names>L</given-names></name></person-group>. <article-title>Approximating XGBoost with an interpretable decision tree</article-title>. <source>Inf Sci.</source> (<year>2021</year>) <volume>572</volume>:<fpage>522</fpage>&#x02013;<lpage>42</lpage>. <pub-id pub-id-type="doi">10.1016/j.ins.2021.05.055</pub-id></citation>
</ref>
<ref id="B28">
<label>28.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yu</surname> <given-names>Y</given-names></name> <name><surname>Si</surname> <given-names>X</given-names></name> <name><surname>Hu</surname> <given-names>C</given-names></name> <name><surname>Zhang</surname> <given-names>J</given-names></name></person-group>. <article-title>A review of recurrent neural networks: LSTM cells and network architectures</article-title>. <source>Neural Comput.</source> (<year>2019</year>) <volume>31</volume>:<fpage>1235</fpage>&#x02013;<lpage>70</lpage>. <pub-id pub-id-type="doi">10.1162/neco_a_01199</pub-id><pub-id pub-id-type="pmid">31113301</pub-id></citation></ref>
<ref id="B29">
<label>29.</label>
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Lundberg</surname> <given-names>SM</given-names></name> <name><surname>Lee</surname> <given-names>SI</given-names></name></person-group>. <article-title>A unified approach to interpreting model predictions</article-title>. In: <source>Advances in Neural Information Processing Systems 30 (Nips 2017).</source> Vol. <volume>30</volume>. <publisher-loc>Long Beach, CA</publisher-loc> (<year>2017</year>). p. <fpage>4768</fpage>&#x02013;<lpage>777</lpage>.</citation>
</ref>
<ref id="B30">
<label>30.</label>
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Zeiler</surname> <given-names>MD</given-names></name> <name><surname>Fergus</surname> <given-names>R</given-names></name></person-group>. <article-title>Visualizing and understanding convolutional networks</article-title>. In: <source>European Conference on Computer Vision</source>. <publisher-loc>Zurich</publisher-loc>: <publisher-name>Springer</publisher-name> (<year>2014</year>). p. <fpage>818</fpage>&#x02013;<lpage>33</lpage>. <pub-id pub-id-type="doi">10.1007/978-3-319-10590-1_53</pub-id></citation>
</ref>
<ref id="B31">
<label>31.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Favaloro</surname> <given-names>EJ</given-names></name> <name><surname>Negrini</surname> <given-names>D</given-names></name></person-group>. <article-title>Machine learning and coagulation testing: the next big thing in hemostasis investigations?</article-title> <source>Clin Chem Lab Med.</source> (<year>2021</year>) <volume>59</volume>:<fpage>1177</fpage>&#x02013;<lpage>9</lpage>. <pub-id pub-id-type="doi">10.1515/cclm-2021-0216</pub-id><pub-id pub-id-type="pmid">33660488</pub-id></citation></ref>
<ref id="B32">
<label>32.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hasegawa</surname> <given-names>D</given-names></name> <name><surname>Yamakawa</surname> <given-names>K</given-names></name> <name><surname>Nishida</surname> <given-names>K</given-names></name> <name><surname>Okada</surname> <given-names>N</given-names></name> <name><surname>Murao</surname> <given-names>S</given-names></name> <name><surname>Nishida</surname> <given-names>O</given-names></name></person-group>. <article-title>Comparative analysis of three machine-learning techniques and conventional techniques for predicting sepsis-induced coagulopathy progression</article-title>. <source>J Clin Med.</source> (<year>2020</year>) <volume>9</volume>:<fpage>2113</fpage>. <pub-id pub-id-type="doi">10.3390/jcm9072113</pub-id><pub-id pub-id-type="pmid">32635574</pub-id></citation></ref>
<ref id="B33">
<label>33.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shickel</surname> <given-names>B</given-names></name> <name><surname>Tighe</surname> <given-names>PJ</given-names></name> <name><surname>Bihorac</surname> <given-names>A</given-names></name> <name><surname>Rashidi</surname> <given-names>P</given-names></name></person-group>. <article-title>Deep EHR: a survey of recent advances in deep learning techniques for electronic health record (EHR) analysis</article-title>. <source>IEEE J Biomed Health Inform.</source> (<year>2017</year>) <volume>22</volume>:<fpage>1589</fpage>&#x02013;<lpage>604</lpage>. <pub-id pub-id-type="doi">10.1109/JBHI.2017.2767063</pub-id><pub-id pub-id-type="pmid">29989977</pub-id></citation></ref>
<ref id="B34">
<label>34.</label>
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>RTQ</given-names></name> <name><surname>Rubanova</surname> <given-names>Y</given-names></name> <name><surname>Bettencourt</surname> <given-names>J</given-names></name> <name><surname>Duvenaud</surname> <given-names>D</given-names></name></person-group>. <article-title>Neural ordinary differential equations</article-title>. In: <source>Advances in Neural Information Processing Systems 31 (Nips 2018).</source> Vol. <volume>31</volume>. <publisher-loc>Montr&#x000E9;al, QC</publisher-loc> (<year>2018</year>).</citation>
</ref>
<ref id="B35">
<label>35.</label>
<citation citation-type="journal"><person-group person-group-type="author"><name><surname>Alber</surname> <given-names>M</given-names></name> <name><surname>Buganza Tepole</surname> <given-names>A</given-names></name> <name><surname>Cannon WR De</surname> <given-names>S</given-names></name> <name><surname>Dura-Bernal</surname> <given-names>S</given-names></name> <name><surname>Garikipati</surname> <given-names>K</given-names></name> <etal/></person-group>. <article-title>Integrating machine learning and multiscale modeling-perspectives, challenges, and opportunities in the biological, biomedical, and behavioral sciences</article-title>. <source>NPJ Digit Med.</source> (<year>2019</year>) <volume>2</volume>:<fpage>115</fpage>. <pub-id pub-id-type="doi">10.1038/s41746-019-0193-y</pub-id><pub-id pub-id-type="pmid">31799423</pub-id></citation></ref>
<ref id="B36">
<label>36.</label>
<citation citation-type="book"><person-group person-group-type="author"><name><surname>Qin</surname> <given-names>Z</given-names></name> <name><surname>Yan</surname> <given-names>L</given-names></name> <name><surname>Zhuang</surname> <given-names>H</given-names></name> <name><surname>Tay</surname> <given-names>Y</given-names></name> <name><surname>Pasumarthi</surname> <given-names>RK</given-names></name> <name><surname>Wang</surname> <given-names>X</given-names></name> <etal/></person-group>. <article-title>Are neural rankers still outperformed by gradient boosted decision trees?</article-title> In: <source>International Conference on Learning Representations (ICLR 2021)</source>. <publisher-loc>Vienna</publisher-loc> (<year>2021</year>).</citation>
</ref>
</ref-list>
</back>
</article>