<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Artif. Intell.</journal-id>
<journal-title>Frontiers in Artificial Intelligence</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Artif. Intell.</abbrev-journal-title>
<issn pub-type="epub">2624-8212</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">610197</article-id>
<article-id pub-id-type="doi">10.3389/frai.2021.610197</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Artificial Intelligence</subject>
<subj-group>
<subject>Methods</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>An Explainable Multimodal Neural Network Architecture for Predicting Epilepsy Comorbidities Based on Administrative Claims Data</article-title>
<alt-title alt-title-type="left-running-head">Linden et&#x20;al.</alt-title>
<alt-title alt-title-type="right-running-head">An Explainable Multimodal Neural Network</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Linden</surname>
<given-names>Thomas</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="fn" rid="fn1">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1096480/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>De Jong</surname>
<given-names>Johann</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Lu</surname>
<given-names>Chao</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Kiri</surname>
<given-names>Victor</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Haeffs</surname>
<given-names>Kathrin</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1099489/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Fr&#xf6;hlich</surname>
<given-names>Holger</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/285008/overview"/>
</contrib>
</contrib-group>
<aff id="aff1">
<label>
<sup>1</sup>
</label>Department of Bioinformatics, Fraunhofer Institute for Algorithms and Scientific Computing (SCAI), Schloss Birlinghoven, <addr-line>Sankt Augustin</addr-line>, <country>Germany</country>
</aff>
<aff id="aff2">
<label>
<sup>2</sup>
</label>Bonn-Aachen International Center for Information Technology (B-IT), University of Bonn, <addr-line>Bonn</addr-line>, <country>Germany</country>
</aff>
<aff id="aff3">
<label>
<sup>3</sup>
</label>UCB Biosciences GmbH, <addr-line>Monheim</addr-line>, <country>Germany</country>
</aff>
<aff id="aff4">
<label>
<sup>4</sup>
</label>UCB Ltd., <addr-line>Raleigh</addr-line>, <addr-line>NC</addr-line>, <country>United States</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/62746/overview">Enrico Capobianco</ext-link>, University of Miami, United&#x20;States</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/531819/overview">Rimpi Khurana</ext-link>, University of Miami Miller School of Medicine, United&#x20;States</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/12494/overview">Thomas Hartung</ext-link>, Johns Hopkins University, United&#x20;States</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Holger Fr&#xf6;hlich, <email>holger.froehlich@scai.fraunhofer.de</email>
</corresp>
<fn fn-type="equal" id="fn1-1">
<label>
<sup>&#x2020;</sup>
</label>
<p>Surname changed from Gerlach to Linden in&#x20;2018</p>
</fn>
<fn fn-type="other">
<p>This article was submitted to Medicine and Public Health, a section of the journal Frontiers in Artificial Intelligence</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>21</day>
<month>05</month>
<year>2021</year>
</pub-date>
<pub-date pub-type="collection">
<year>2021</year>
</pub-date>
<volume>4</volume>
<elocation-id>610197</elocation-id>
<history>
<date date-type="received">
<day>25</day>
<month>09</month>
<year>2020</year>
</date>
<date date-type="accepted">
<day>21</day>
<month>04</month>
<year>2021</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2021 Linden, De Jong, Lu, Kiri, Haeffs and Fr&#xf6;hlich.</copyright-statement>
<copyright-year>2021</copyright-year>
<copyright-holder>Linden, De Jong, Lu, Kiri, Haeffs and Fr&#xf6;hlich</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these&#x20;terms.</p>
</license>
</permissions>
<abstract>
<p>Epilepsy is a complex brain disorder characterized by repetitive seizure events. Epilepsy patients often suffer from various and severe physical and psychological comorbidities (e.g., anxiety, migraine, and stroke). While general comorbidity prevalences and incidences can be estimated from epidemiological data, such an approach does not take into account that actual patient-specific risks can depend on various individual factors, including medication. This motivates to develop a machine learning approach for predicting risks of future comorbidities for individual epilepsy patients. In this work, we use inpatient and outpatient administrative health claims data of around 19,500 U.S. epilepsy patients. We suggest a dedicated multimodal neural network architecture (Deep personalized LOngitudinal convolutional RIsk model&#x2014;DeepLORI) to predict the time-dependent risk of six common comorbidities of epilepsy patients. We demonstrate superior performance of DeepLORI in a comparison with several existing methods. Moreover, we show that DeepLORI-based predictions can be interpreted on the level of individual patients. Using a game theoretic approach, we identify relevant features in DeepLORI models and demonstrate that model predictions are explainable in light of existing knowledge about the disease. Finally, we validate the model on independent data from around 97,000 patients, showing good generalization and stable prediction performance over&#x20;time.</p>
</abstract>
<kwd-group>
<kwd>precision medicine</kwd>
<kwd>personalized medicine</kwd>
<kwd>P4 medicine</kwd>
<kwd>comorbidity prediction</kwd>
<kwd>administrative claims data</kwd>
<kwd>epilepsy</kwd>
<kwd>neural networks</kwd>
<kwd>machine learning</kwd>
</kwd-group>
</article-meta>
</front>
<body>
<sec id="s1">
<title>Introduction</title>
<p>Epilepsy is a complex, life-threatening brain disorder characterized by repetitive seizure events. Epilepsy patients often suffer from various and severe physical and psychological comorbidities, such as overweight and obesity, anxiety, migraine, bipolar disorder, and cardiovascular diseases (<xref ref-type="bibr" rid="B44">Seidenberg et&#x20;al., 2009</xref>; <xref ref-type="bibr" rid="B34">Ottman et&#x20;al., 2011</xref>; <xref ref-type="bibr" rid="B24">Keezer et&#x20;al., 2016</xref>). Some comorbidities confer a poor disease prognosis because they complicate pharmacological treatment owing to possible drug&#x2013;drug interactions and adverse events (<xref ref-type="bibr" rid="B53">Verrotti and Mazzocchetti, 2016</xref>). The actual development of comorbidities is dependent on patient-specific factors and may be modulated by antiepileptic drug (AED) treatment (<xref ref-type="bibr" rid="B58">Zaccara, 2009</xref>). Early identification and treatment of comorbidities has thus been identified as highly relevant to improve the quality of life of epilepsy patients (<xref ref-type="bibr" rid="B53">Verrotti and Mazzocchetti, 2016</xref>). However, there is a high subject-to-subject variability. Methods from the field of artificial intelligence (AI), and more specifically machine learning (ML), have the potential to predict comorbidity risks on an individual subject basis, hence fulfilling one of the promises of a more individualized patient care in the sense of precision medicine. More specifically, ML-based approaches can be used to aid disease prevention by predicting the time-dependent risk of an individual epilepsy patient to develop several common comorbidities in the future, such as 1) anxiety, 2) bipolar disorder and schizophrenia, 3) diabetes type 2, 4) migraine, 5) overweight and obesity, and 6) stroke and ischemic attacks.</p>
<p>Machine learning models to predict individualized comorbidity risks of diseases different from epilepsy have recently been published (e.g., <xref ref-type="bibr" rid="B11">Dworzynski et&#x20;al. (2020)</xref> and <xref ref-type="bibr" rid="B32">Noh et&#x20;al. (2020)</xref>) using clinical routine data from the Danish national registry and hospital electronic health records, respectively. For epilepsy, <xref ref-type="bibr" rid="B15">Glauser et&#x20;al. (2020</xref>) proposed an ML model for psychiatric comorbidities based on survey data from 122 patients. In our earlier work (<xref ref-type="bibr" rid="B14">Gerlach et&#x20;al., 2017</xref>), we proposed an ML model (random survival forests) using U.S. administrative health claims data from &#x223c;10,000 epilepsy patients to predict several major comorbidities (anxiety, bipolar disorder and schizophrenia, diabetes type 2, migraine, overweight and obesity, and stroke and ischemic attacks) of epilepsy patients.</p>
<p>Administrative health claims data have generally been shown useful for developing ML models in the epilepsy field. For example, <xref ref-type="bibr" rid="B1">An et&#x20;al. (2018)</xref> used claims data of more than 1.3 million epilepsy patients to predict antiepileptic drug resistance. Examples from other disease areas include prediction of Alzheimer&#x2019;s disease (<xref ref-type="bibr" rid="B35">Park et&#x20;al., 2020</xref>), osteoporotic hip fractures (<xref ref-type="bibr" rid="B12">Engels et&#x20;al., 2020</xref>), and heart failure (<xref ref-type="bibr" rid="B9">Desai et&#x20;al., 2020</xref>). The opportunities of healthcare claims data for ML-based modeling have further been discussed in (<xref ref-type="bibr" rid="B13">Fr&#xf6;hlich et&#x20;al., 2018</xref>; <xref ref-type="bibr" rid="B31">Miotto et&#x20;al., 2018</xref>; <xref ref-type="bibr" rid="B57">Xiao et&#x20;al, 2018</xref>; <xref ref-type="bibr" rid="B49">Thesmar et&#x20;al., 2019</xref>; <xref ref-type="bibr" rid="B25">Kwak and Hui, 2020</xref>).</p>
<p>In our earlier work, we demonstrated the possibility to augment claims data with biomedical background knowledge, hence enabling the interpretation of machine learning models down to the level of disease-associated biological processes (<xref ref-type="bibr" rid="B14">Gerlach et&#x20;al., 2017</xref>). The particular novelty of the present work is a dedicated multimodal neural network architecture for administrative claims data, which we call Deep personalized LOngitudinal convolutional RIsk model (DeepLORI). We show that DeepLORI more accurately predicts the time-dependent risk for six common comorbidities on the level of individual patients than several competing methods, including our own previously proposed model. Using a game theoretic approach based on Shapley Additive Explanations (<xref ref-type="bibr" rid="B27">Lundberg and Lee, 2017</xref>), we show that DeepLORI models are explainable, also on the level of predictions for individual patients.</p>
</sec>
<sec id="s2">
<title>Data</title>
<sec id="s2-1">
<title>Claims-Based Electronic Health Records</title>
<p>U.S. commercial inpatient and outpatient data were obtained from IBM&#xae; MarketScan&#xae; Truven Health databases. The Commercial Claims and Encounters database within MarketScan&#xae; is a nationally representative collection of de-identified patient-specific inpatient, outpatient, and pharmaceutical claims from more than 200 insurance carriers and large, self-insuring companies. All dates and time stamps were transformed from a daily to a monthly scale (1&#xa0;month &#x3d; 30&#xa0;days) for a more robust representation. The data generally comprise demographic (age, gender) and regional information (major metropolitan area), days in hospital, health insurance plan, and time-dependent diagnosis codes and prescriptions (plus prescription duration and quantity).</p>
<p>We used two cohorts: 1) the original data covering years 2011&#x2013;2015 for model training and evaluation within a nested cross-validation scheme, and 2) the external validation data covering years 2008&#x2013;2018 to validate the models trained on the &#x201c;original data.&#x201d; In agreement to our earlier publication (<xref ref-type="bibr" rid="B14">Gerlach et&#x20;al., 2017</xref>) and common practice at UCB, epilepsy patients in the original data were identified matching at least one of the following criteria:<list list-type="simple">
<list-item>
<p>(1) An occurrence of &#x2265; 2 ICD-9-CM codes of 345.xx (i.e.,&#x20;epilepsy, except 345.3&#x2014;grand mal status) among separate medical encounters (separate dates in any care venue)</p>
</list-item>
<list-item>
<p>(2) An occurrence of &#x2265;1 ICD-9-CM code of 345.xx (except for 345.3) AND &#x2265;1 ICD-9-CM code of 780.39 (convulsions) among separate medical encounters</p>
</list-item>
<list-item>
<p>(3) An occurrence of 1 ICD-9-CM code of 345.xx (except for 345.3) and code(s) for AED prescription at least a day after the 345.xx&#x20;code</p>
</list-item>
<list-item>
<p>(4) An occurrence of &#x2265;2 ICD codes of 780.39 among separate medical encounters and code(s) for AED treatment. The code(s) for the AED treatment should occur at least a day after the second 780.39 irrespective of the presence or absence of an AED code after the first 780.39&#x20;code</p>
</list-item>
<list-item>
<p>(5) Individuals with ICD-9-CM code 345.3 will be required to have an occurrence of &#x2265;2 ICD-9-CM codes of 345.3 separated by at least 30&#xa0;days, or an occurrence of the 345.3 code and &#x2265;1 ICD-9-CM code 780.39 separated by at least 30&#xa0;days, or &#x2265;1 ICD-9-CM code 345.3 and &#x2265;1 ICD-9-CM code 345.xx encounters on separate&#x20;days</p>
</list-item>
</list>
</p>
<p>The index date for each patient was defined as the time point of the first epilepsy diagnosis, and for definitions requiring at least 2 ICD-9-CM codes, the first diagnosis code was the index date. The data were further filtered by requiring for each patient 1) at least 365&#xb0;days of medical history before, and 365-day follow-up after the index date; 2) age between 18 and 65&#x20;years; 3) any AED treatment during the observation period. Altogether this yielded 7,430,840 records from 19,510 patients. More details about the filtering process can be found in the <xref ref-type="sec" rid="s11">Supplementary Material</xref> of this article. For part of these patients, diagnoses after the index date were coded in ICD10, which we mapped to ICD-9-CM via the Thomas Reuters<sup>TM</sup> public Web resource<xref ref-type="fn" rid="fn1">
<sup>1</sup>
</xref> and manual curation.</p>
<p>Note that in medical practice, confirmation of the final diagnosis &#x201c;epilepsy&#x201d; can be complicated and often requires a number of visits. Moreover, reporting of a dedicated diagnosis within our data does not necessarily correspond to the actual time point of the medical condition within the patient. To capture this uncertainty, we defined a three-month time interval starting from the index date as the &#x201c;epilepsy diagnosis period&#x201d;. That means the actual medical history of each patient after application of the abovementioned filter criteria was 365&#x20;&#x2b; 91&#xb0;days, that is, 456&#xb0;days.</p>
<p>Diagnosis codes after 1st Oct 2015 were provided as ICD-10-CM codes. Accordingly, the following modified inclusion criteria were applied to select epilepsy patients in the external validation data (covering 2008&#x2013;2018):<list list-type="simple">
<list-item>
<p>(1) The presence of at least 1 ICD-9-CM of 345.xx or ICD-10-CM of G40.xx (epilepsy)</p>
</list-item>
<list-item>
<p>(2) The presence of at least 2 ICD-9-CM of 780.39 or ICD-10-CM of R56.9 (convulsions) within one&#x20;year.</p>
</list-item>
</list>
</p>
<p>After applying the same filter criteria as for the original data, this resulted in 112,755 patients. Within those patients, we pre-filtered diagnosis codes and substances observed in <inline-formula id="inf1">
<mml:math id="m1">
<mml:mrow>
<mml:mo>&#x2264;</mml:mo>
<mml:mn>10</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula> patients or with a frequency &#x2264;1%. One of the main issues with claims data is that one and the same diagnosis may be coded with different ICD codes. Moreover, observations related to one specific ICD9/10 code could be rare. To address these issues, we mapped all ICD-9-CM codes to PheWAS terms, which describe a higher level aggregate of several ICD codes (<xref ref-type="bibr" rid="B5">Carroll et&#x20;al., 2014</xref>). In addition, a mapping to MeSH (<xref ref-type="bibr" rid="B40">Rogers, 1963</xref>) was performed to allow for integration with other data sources (see <italic>Methods</italic>).</p>
</sec>
<sec id="s2-2">
<title>Definition of Focused Comorbidities and Compilation of Training Data</title>
<p>Based on the medical literature and observed frequency in our data, we focused on six common comorbidities of epilepsy patients: 1) anxiety, 2) bipolar and schizophrenia, 3) diabetes type 2, 4) migraine, 5) overweight and obesity, and 6) stroke and ischemic attack. These comorbidities were defined according to a set of PheWAS codes provided in the supplements (<xref ref-type="sec" rid="s11">Supplementary Table&#x20;S1</xref>).</p>
<p>The number of patients with these comorbidities being diagnosed at least 6&#x20;months after the epilepsy diagnosis period differs widely across comorbidities (<xref ref-type="table" rid="T1">Table&#x20;1</xref>). We would like to highlight that our data are in principle right-censored, that is, the diagnosis of a specific comorbidity might happen after the end of the period covered by our training data. Moreover, a significant proportion of those individuals where a diagnosis of a specific comorbidity is observed (i.e.,&#x20;incident cases) have already been diagnosed with at least one of the other 5 comorbidities during their medical history (<xref ref-type="table" rid="T1">Table&#x20;1</xref>). Note that for training a machine learning model to predict a specific comorbidity, we should not have an observation of the same comorbidity in the medical history of any of the training samples. For this reason, the number of patients in the training data is different per comorbidity, and we developed separate machine learning models for each comorbidity.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Proportion of incident patients by comorbidity.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Comorbidity</th>
<th align="center">
<italic>n</italic> total</th>
<th align="center">
<italic>n</italic> incident</th>
<th align="center">% Incident</th>
<th align="center">Mean&#x20;&#xb1; sd, no. of other comorbidities in medical history per incident patient</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Anxiety</td>
<td align="center">15,274</td>
<td align="center">4,037</td>
<td align="char" char=".">26%</td>
<td align="char" char="plusmn">1.3&#x20;&#xb1; 0.6</td>
</tr>
<tr>
<td align="left">Bipolar/Schizophrenia</td>
<td align="center">16,908</td>
<td align="center">1,279</td>
<td align="char" char=".">8%</td>
<td align="char" char="plusmn">1.5&#x20;&#xb1; 0.8</td>
</tr>
<tr>
<td align="left">Diabetes type 2</td>
<td align="center">16,929</td>
<td align="center">1,377</td>
<td align="char" char=".">8%</td>
<td align="char" char="plusmn">1.5&#x20;&#xb1; 0.8</td>
</tr>
<tr>
<td align="left">Migraine</td>
<td align="center">16,036</td>
<td align="center">2,063</td>
<td align="char" char=".">13%</td>
<td align="char" char="plusmn">1.3&#x20;&#xb1; 0.7</td>
</tr>
<tr>
<td align="left">Overweight/Obesity</td>
<td align="center">17,273</td>
<td align="center">3,307</td>
<td align="char" char=".">19%</td>
<td align="char" char="plusmn">1.4&#x20;&#xb1; 0.7</td>
</tr>
<tr>
<td align="left">Stroke/Ischemic Attack</td>
<td align="center">17,208</td>
<td align="center">1,157</td>
<td align="char" char=".">7%</td>
<td align="char" char="plusmn">1.5&#x20;&#xb1; 0.8</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Each diagnosis and prescription in our data has an associated time stamp. Due to the fact that the appearance of a record in our data does not necessarily correspond to the observation of the actual medical condition, each time stamp was mapped to a monthly (&#x3d; 30-day time interval) resolution.</p>
</sec>
</sec>
<sec sec-type="methods" id="s3">
<title>Methods</title>
<sec id="s3-1">
<title>Proposed Model: DeepLORI</title>
<sec id="s3-1-1">
<title>DeepLORI Architecture</title>
<p>As highlighted before, our aim was to develop separate machine learning models for each of six typical comorbidities of epilepsy patients. Each of these models aims for predicting the time-dependent risk of an individual to be diagnosed with one specific comorbidity.</p>
<p>We came up with a dedicated neural network model for our purposes, which we call Deep personalized LOngitudinal convolution RIsk model (DeepLORI). We start by explaining the principle architecture of DeepLORI. In agreement to our former work, one of the key ideas is that claims data have an inherent hierarchical structure (<xref ref-type="bibr" rid="B14">Gerlach et&#x20;al., 2017</xref>): The data initially contain three major types of features: 1) prescribed substance codes, 2) diagnoses codes (mapped to PheWAS terms, see above), and 3) general demographic information, such as age, gender, and major metropolitan area information. Monthly reported prescriptions and diagnoses can typically be represented via a one-hot vector encoding. However, individual substance and diagnose codes are typically, rather sparsely, observed over time, which can potentially lead to challenges for a machine learning algorithm to find regularities.</p>
<p>Based on this consideration, our idea was to use additional background knowledge available in databases to impose further hierarchical substructure: For example, each prescribed substance may have one or several known targets, and it can have a number of side effects reported in clinical studies. Diagnoses have associated symptoms, and in some cases, biomarkers may exist. Based on this background information, each domain of features (e.g., diagnosis) can be further associated to several subdomains (e.g., biomarkers and impaired biological pathways). Subdomain features can subsequently be represented via a one-hot vector encoding. <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>; <xref ref-type="table" rid="T2">Table&#x20;2</xref> provide an overview about the domains and corresponding subdomains we defined in our data. (More details about our previously published approach to augment claims data with biomedical knowledge can be found in the supplements.)</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Hierarchical data model structures the data in 3 input domains (general, drug, and diagnosis) and according subdomains. Features retrieved from the claims data are highlighted in red, and all others are augmented features (including those highlighted in blue).</p>
</caption>
<graphic xlink:href="frai-04-610197-g001.tif"/>
</fig>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Number of features by domain, subdomain, and feature origin (claims data or biomedical background knowledge).</p>
</caption>
<table>
<thead valign="top">
<tr>
<th rowspan="2" align="left">Domain</th>
<th rowspan="2" align="center">Subdomain</th>
<th colspan="2" align="center">Feature origin</th>
<th rowspan="2" align="center">&#x23;Time-dependent features (per 30-day time interval)</th>
<th rowspan="2" align="center">&#x23;static features</th>
</tr>
<tr>
<th align="center">Claims data</th>
<th align="center">Background knowledge</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Diagnosis</td>
<td align="left">Biomarker</td>
<td align="left"/>
<td align="center">X</td>
<td align="center">699</td>
<td align="left"/>
</tr>
<tr>
<td align="left">Diagnosis</td>
<td align="left">GO term</td>
<td align="left"/>
<td align="center">X</td>
<td align="center">3,759</td>
<td align="left"/>
</tr>
<tr>
<td align="left">Diagnosis</td>
<td align="left">MeSH disease</td>
<td align="left"/>
<td align="center">X</td>
<td align="center">137</td>
<td align="left"/>
</tr>
<tr>
<td align="left">Diagnosis</td>
<td align="left">Pathway</td>
<td align="left"/>
<td align="center">X</td>
<td align="center">453</td>
<td align="left"/>
</tr>
<tr>
<td align="left">
<bold>Diagnosis</bold>
</td>
<td align="left">
<bold>PheWAS</bold>
</td>
<td align="center">x</td>
<td align="left"/>
<td align="center">
<bold>1,196</bold>
</td>
<td align="left"/>
</tr>
<tr>
<td align="left">Diagnosis</td>
<td align="left">Symptoms</td>
<td align="left"/>
<td align="center">X</td>
<td align="center">235</td>
<td align="left"/>
</tr>
<tr>
<td align="left">
<bold>General</bold>
</td>
<td align="left">
<bold>Age, sex, insurance, hospital</bold>
</td>
<td align="center">x</td>
<td align="left"/>
<td align="left"/>
<td align="char" char=".">
<bold>17</bold>
</td>
</tr>
<tr>
<td align="left">General</td>
<td align="left">Medical risk</td>
<td align="left"/>
<td align="center">X</td>
<td align="left"/>
<td align="char" char=".">53</td>
</tr>
<tr>
<td align="left">
<bold>General</bold>
</td>
<td align="left">
<bold>Region</bold>
</td>
<td align="center">x</td>
<td align="left"/>
<td align="left"/>
<td align="char" char=".">
<bold>403</bold>
</td>
</tr>
<tr>
<td align="left">Drug</td>
<td align="left">GO term</td>
<td align="left"/>
<td align="center">X</td>
<td align="center">1,240</td>
<td align="left"/>
</tr>
<tr>
<td align="left">Drug</td>
<td align="left">Pathway</td>
<td align="left"/>
<td align="center">X</td>
<td align="center">435</td>
<td align="left"/>
</tr>
<tr>
<td align="left">Drug</td>
<td align="left">PheWAS (known indications)</td>
<td align="left"/>
<td align="center">X</td>
<td align="center">986</td>
<td align="left"/>
</tr>
<tr>
<td align="left">Drug</td>
<td align="left">Side effects x frequency</td>
<td align="left"/>
<td align="center">x</td>
<td align="center">1,489</td>
<td align="left"/>
</tr>
<tr>
<td align="left">Drug</td>
<td align="left">
<bold>Substance name</bold>
</td>
<td align="center">x</td>
<td align="left"/>
<td align="center">
<bold>453</bold>
</td>
<td align="left"/>
</tr>
<tr>
<td align="left">Drug</td>
<td align="left">Target tissue</td>
<td align="left"/>
<td align="center">x</td>
<td align="center">32</td>
<td align="left"/>
</tr>
<tr>
<td align="left">Drug</td>
<td align="left">Therapeutic class</td>
<td align="left"/>
<td align="center">x</td>
<td align="center">104</td>
<td align="left"/>
</tr>
<tr>
<td align="left">Drug</td>
<td align="left">Therapeutic group</td>
<td align="left"/>
<td align="center">x</td>
<td align="center">19</td>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="center">
<inline-formula id="inf2">
<mml:math id="m2">
<mml:mrow>
<mml:mi mathvariant="normal">&#x2211;</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>11,237</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
<td align="center">
<inline-formula id="inf3">
<mml:math id="m3">
<mml:mrow>
<mml:mi mathvariant="normal">&#x2211;</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>437</mml:mn>
</mml:mrow>
</mml:math>
</inline-formula>
</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn id="Tfn1">
<p>Bold values indicate that the &#x201c;Feature origin&#x201d; is &#x201c;Claims Data&#x201d;.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>In this work, we propose a multimodal neural network architecture to reflect the specific structure of the augmented claims data (see <xref ref-type="fig" rid="F2">Figure&#x20;2</xref>). In this architecture, each of the feature domains and subdomains are initially treated as separate data modalities. Note that each feature derived from diagnosis and substance codes has an additional time stamp (30-day interval), that is, each subdomain is a three-dimensional data cube. Each of these tensors is projected down to a lower dimensional representation via bottleneck feedforward architecture with 1&#x2013;4 hidden layers, where the exact number of hidden layers and units per layer are treated as tunable hyperparameters in our framework (see details in <xref ref-type="sec" rid="s11">Supplementary Material</xref>). In conclusion, at the first layers for each subdomain, specific latent features are extracted in a nonlinear manner from the original data and subsequently concatenated.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>DeepLORI model architecture: The input is organized as a multimodal data cube, which is subdivided into several feature domains. Medication and diagnosis-related features are time-dependent, whereas features in the &#x201c;general&#x201d; domain are not. The three different colors at stage (3) symbolize the 3 different pooling/convolution kernel&#x20;sizes.</p>
</caption>
<graphic xlink:href="frai-04-610197-g002.tif"/>
</fig>
<p>After latent feature extraction, DeepLORI models the time-dependency in the data within each feature domain. For that purpose, we apply a pooling function (max or mean) over the entire time series simultaneously for all feature domains, but individually for each component of our one-hot vector representations. The exact choice of the pooling function is a hyperparameter. In addition to pooling, we allow for the application of different time convolutional kernels (with multiple filters per kernel), similar to a sliding window. Whether or not convolutional filters are applied and which sizes these filters have are again determined within hyperparameter optimization.</p>
<p>After modeling time-dependency, there is another feedforward bottleneck structure (same tunable design as for the initial latent feature extraction) in our network. Finally, DeepLORI concatenates latent features extracted from each feature domain and feeds them through the last feedforward bottleneck structure into one output unit, representing a patient-specific comorbidity risk score. That means we have one DeepLORI model per comorbidity. (A more detailed view on the DeepLORI architecture, including an overview of all tunable hyperparameters can be found in <xref ref-type="sec" rid="s11">Supplementary Material</xref>.)</p>
</sec>
<sec id="s3-1-2">
<title>Loss Function</title>
<p>Let the training data be denoted as <inline-formula id="inf4">
<mml:math id="m4">
<mml:mrow>
<mml:mi>D</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mrow>
<mml:mo>{</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>&#x3b4;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo>&#x7c;</mml:mo>
</mml:mrow>
<mml:mtext>&#x2003;</mml:mtext>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo>&#x2208;</mml:mo>
<mml:msup>
<mml:mi mathvariant="normal">&#x211d;</mml:mi>
<mml:mrow>
<mml:mi>d</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mi>T</mml:mi>
</mml:mrow>
</mml:msup>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2208;</mml:mo>
<mml:mi mathvariant="normal">&#x211d;</mml:mi>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>&#x3b4;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2208;</mml:mo>
<mml:mrow>
<mml:mo>{</mml:mo>
<mml:mrow>
<mml:mn>0,1</mml:mn>
</mml:mrow>
<mml:mo>}</mml:mo>
</mml:mrow>
<mml:mo>,</mml:mo>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1,2</mml:mn>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:mi>n</mml:mi>
<mml:mo>,</mml:mo>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mo>&#xa0;</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1,2</mml:mn>
<mml:mo>,</mml:mo>
<mml:mo>&#x2026;</mml:mo>
<mml:mo>,</mml:mo>
<mml:mi>T</mml:mi>
</mml:mrow>
<mml:mo>}</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>, where <inline-formula id="inf5">
<mml:math id="m5">
<mml:mi>T</mml:mi>
</mml:math>
</inline-formula> is the maximum number of time stamps in the data (in our case, 15&#xa0;months) and <inline-formula id="inf6">
<mml:math id="m6">
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is the observed time of the first diagnosis of a comorbidity (in case data are not censored) after the index date or the maximum observed event free time. Moreover, <inline-formula id="inf7">
<mml:math id="m7">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3b4;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2208;</mml:mo>
<mml:mrow>
<mml:mo>{</mml:mo>
<mml:mrow>
<mml:mn>0,1</mml:mn>
</mml:mrow>
<mml:mo>}</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> is a binary variable indicating whether <inline-formula id="inf8">
<mml:math id="m8">
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> is right-censored <inline-formula id="inf9">
<mml:math id="m9">
<mml:mrow>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>&#x3b4;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>0</mml:mn>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> or not <inline-formula id="inf10">
<mml:math id="m10">
<mml:mrow>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>&#x3b4;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>. Following <xref ref-type="bibr" rid="B23">Katzman et&#x20;al. (2018)</xref>, we here use the negative partial log-likelihood of a Cox proportional hazards model (<xref ref-type="bibr" rid="B8">Cox, 1972</xref>) as a loss function for training DeepLORI:<disp-formula id="equ1">
<mml:math id="m11">
<mml:mrow>
<mml:mi mathvariant="bold-italic">l</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi mathvariant="bold-italic">W</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi mathvariant="bold-italic">y</mml:mi>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi mathvariant="bold-italic">n</mml:mi>
</mml:munderover>
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">&#x3b4;</mml:mi>
<mml:mi mathvariant="bold-italic">i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mstyle>
<mml:mrow>
<mml:mo>[</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">N</mml:mi>
<mml:mi mathvariant="bold-italic">W</mml:mi>
</mml:msub>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">x</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mo>&#x22c5;</mml:mo>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>log</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:munder>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi mathvariant="bold-italic">j</mml:mi>
<mml:mo>:</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">y</mml:mi>
<mml:mi mathvariant="bold-italic">j</mml:mi>
</mml:msub>
<mml:mo>&#x2265;</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">y</mml:mi>
<mml:mi mathvariant="bold-italic">i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:munder>
<mml:mrow>
<mml:mi mathvariant="bold">ex</mml:mi>
<mml:msup>
<mml:mi mathvariant="bold">p</mml:mi>
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">N</mml:mi>
<mml:mi mathvariant="bold-italic">W</mml:mi>
</mml:msub>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">x</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">j</mml:mi>
<mml:mo>&#x22c5;</mml:mo>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo>]</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>where <inline-formula id="inf11">
<mml:math id="m12">
<mml:mrow>
<mml:msub>
<mml:mi>N</mml:mi>
<mml:mi>W</mml:mi>
</mml:msub>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mo>&#x22c5;</mml:mo>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> denotes the risk score learned by DeepLORI, parameterized by weights <inline-formula id="inf12">
<mml:math id="m13">
<mml:mi>W</mml:mi>
</mml:math>
</inline-formula>, and <inline-formula id="inf13">
<mml:math id="m14">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">x</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mo>&#x22c5;</mml:mo>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> the medical history of patient&#x20;<inline-formula id="inf14">
<mml:math id="m15">
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>.</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>
</p>
<p>Given <inline-formula id="inf15">
<mml:math id="m16">
<mml:mrow>
<mml:msub>
<mml:mi>N</mml:mi>
<mml:mi>W</mml:mi>
</mml:msub>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mo>&#x22c5;</mml:mo>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>, the hazard of a patient with feature vector <italic>x</italic> at time <italic>t</italic> is<disp-formula id="equ2">
<mml:math id="m17">
<mml:mrow>
<mml:mi>h</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mrow>
<mml:mo>&#x7c;</mml:mo>
<mml:mi>x</mml:mi>
</mml:mrow>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:msub>
<mml:mi>h</mml:mi>
<mml:mn>0</mml:mn>
</mml:msub>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi>ex</mml:mi>
<mml:msup>
<mml:mi mathvariant="normal">p</mml:mi>
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="italic">N</mml:mi>
<mml:mi mathvariant="italic">W</mml:mi>
</mml:msub>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi mathvariant="italic">x</mml:mi>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>where <inline-formula id="inf16">
<mml:math id="m18">
<mml:mrow>
<mml:msub>
<mml:mi>h</mml:mi>
<mml:mn>0</mml:mn>
</mml:msub>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> is the so-called baseline hazard, which can be estimated according to (<xref ref-type="bibr" rid="B4">Breslow, 1972</xref>):<disp-formula id="equ3">
<mml:math id="m19">
<mml:mrow>
<mml:msub>
<mml:mi>h</mml:mi>
<mml:mn>0</mml:mn>
</mml:msub>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mstyle displaystyle="true">
<mml:munderover>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:munderover>
<mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:mi>I</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>y</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x2264;</mml:mo>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:msub>
<mml:mi>&#x3b4;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msub>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi mathvariant="bold-italic">j</mml:mi>
<mml:mo>:</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">y</mml:mi>
<mml:mi mathvariant="bold-italic">j</mml:mi>
</mml:msub>
<mml:mo>&#x2265;</mml:mo>
<mml:msub>
<mml:mi mathvariant="bold-italic">y</mml:mi>
<mml:mi mathvariant="bold-italic">i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mi mathvariant="bold">ex</mml:mi>
<mml:msup>
<mml:mi mathvariant="bold">p</mml:mi>
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">N</mml:mi>
<mml:mi mathvariant="bold-italic">W</mml:mi>
</mml:msub>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="bold-italic">x</mml:mi>
<mml:mrow>
<mml:mi mathvariant="bold-italic">j</mml:mi>
<mml:mo>&#x22c5;</mml:mo>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:math>
</disp-formula>
</p>
<p>The corresponding time-dependent conditional probability for staying event-free (i.e.,&#x20;not suffering from the specified comorbidity) is then<disp-formula id="equ4">
<mml:math id="m20">
<mml:mrow>
<mml:mi>S</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi>t</mml:mi>
<mml:mrow>
<mml:mo>&#x7c;</mml:mo>
<mml:mi>x</mml:mi>
</mml:mrow>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mi>exp</mml:mi>
<mml:mrow>
<mml:mo>{</mml:mo>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mstyle displaystyle="true">
<mml:mrow>
<mml:msubsup>
<mml:mo>&#x222b;</mml:mo>
<mml:mn>0</mml:mn>
<mml:mi>t</mml:mi>
</mml:msubsup>
<mml:mrow>
<mml:mrow>
<mml:mi>ex</mml:mi>
<mml:msup>
<mml:mi mathvariant="normal">p</mml:mi>
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="italic">N</mml:mi>
<mml:mi mathvariant="italic">W</mml:mi>
</mml:msub>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi mathvariant="italic">x</mml:mi>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msup>
</mml:mrow>
<mml:mtext>d</mml:mtext>
<mml:msub>
<mml:mi>h</mml:mi>
<mml:mn>0</mml:mn>
</mml:msub>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>u</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
<mml:mo>}</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</disp-formula>
</p>
<p>To avoid over-fitting, we regularize DeepLORI during training in multiple ways:<list list-type="simple">
<list-item>
<p>&#x2022; We use dropout units in the input and hidden layers.</p>
</list-item>
<list-item>
<p>&#x2022; We perform batch normalization (<xref ref-type="bibr" rid="B20">Ioffe and Szegedy, 2015</xref>) before each activation function.</p>
</list-item>
<list-item>
<p>&#x2022; We impose groupwise elastic net penalties for weights (<xref ref-type="bibr" rid="B59">Zou and Hastie, 2005</xref>).</p>
</list-item>
</list>
</p>
<p>The elastic net is an extension of the classical lasso algorithm (<xref ref-type="bibr" rid="B50">Tibshirani, 1996</xref>), which has originally been introduced in the context of generalized linear models. It combines an <inline-formula id="inf17">
<mml:math id="m21">
<mml:mrow>
<mml:msub>
<mml:mi>&#x2113;</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>&#xa0;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>penalty of coefficients (like in lasso regression) with an <inline-formula id="inf18">
<mml:math id="m22">
<mml:mrow>
<mml:msub>
<mml:mi>&#x2113;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo>&#xa0;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>penalty (like in ridge regression) (<xref ref-type="bibr" rid="B18">Hoerl and Kennard, 1970</xref>). The elastic net enforces a sparse regression model by jointly pushing coefficients toward zero via the <inline-formula id="inf19">
<mml:math id="m23">
<mml:mrow>
<mml:msub>
<mml:mi>&#x2113;</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>&#xa0;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>penalty, that is, there is a feature selection. At the same time, the <inline-formula id="inf20">
<mml:math id="m24">
<mml:mrow>
<mml:msub>
<mml:mi mathvariant="normal">&#x2113;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo>&#xa0;</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula>penalty promotes a joint selection of correlated features (<xref ref-type="bibr" rid="B59">Zou and Hastie, 2005</xref>). The idea of the elastic net can also be extended to neural networks. More specifically, by adding groupwise elastic net penalties, we modify our training objective as follows:<disp-formula id="equ5">
<mml:math id="m25">
<mml:mrow>
<mml:mi>l</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi mathvariant="bold-italic">W</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi>y</mml:mi>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x2b;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:munder>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>s</mml:mi>
<mml:mi mathvariant="italic">&#x3f5;</mml:mi>
<mml:mi>S</mml:mi>
</mml:mrow>
</mml:munder>
<mml:mrow>
<mml:msubsup>
<mml:mi>&#x3bb;</mml:mi>
<mml:mi>s</mml:mi>
<mml:mrow>
<mml:msub>
<mml:mi>&#x2113;</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mrow>
</mml:msubsup>
<mml:msub>
<mml:mrow>
<mml:mrow>
<mml:mo>&#x2016;</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>W</mml:mi>
<mml:mi>s</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo>&#x2016;</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mrow>
</mml:mstyle>
<mml:mo>&#x2b;</mml:mo>
<mml:msubsup>
<mml:mi>&#x3bb;</mml:mi>
<mml:mi>s</mml:mi>
<mml:mrow>
<mml:msub>
<mml:mi>&#x2113;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
</mml:mrow>
</mml:msubsup>
<mml:msub>
<mml:mrow>
<mml:mrow>
<mml:mo>&#x2016;</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>W</mml:mi>
<mml:mi>s</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo>&#x2016;</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msub>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x2b;</mml:mo>
<mml:msubsup>
<mml:mi>&#x3bb;</mml:mi>
<mml:mi>D</mml:mi>
<mml:mrow>
<mml:msub>
<mml:mi>&#x2113;</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mrow>
</mml:msubsup>
<mml:msub>
<mml:mrow>
<mml:mrow>
<mml:mo>&#x2016;</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>W</mml:mi>
<mml:mi>D</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo>&#x2016;</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>&#x2b;</mml:mo>
<mml:msubsup>
<mml:mi>&#x3bb;</mml:mi>
<mml:mi>D</mml:mi>
<mml:mrow>
<mml:msub>
<mml:mi>&#x2113;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
</mml:mrow>
</mml:msubsup>
<mml:msub>
<mml:mrow>
<mml:mrow>
<mml:mo>&#x2016;</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>W</mml:mi>
<mml:mi>D</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo>&#x2016;</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mn>2</mml:mn>
</mml:msub>
</mml:mrow>
</mml:math>
</disp-formula>where <inline-formula id="inf21">
<mml:math id="m26">
<mml:mi>S</mml:mi>
</mml:math>
</inline-formula> is the set of feature subdomains. Furthermore, <inline-formula id="inf22">
<mml:math id="m27">
<mml:mrow>
<mml:msubsup>
<mml:mi>&#x3bb;</mml:mi>
<mml:mi>s</mml:mi>
<mml:mrow>
<mml:msub>
<mml:mi>&#x2113;</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
</mml:mrow>
</mml:msubsup>
<mml:mo>,</mml:mo>
<mml:msubsup>
<mml:mi>&#x3bb;</mml:mi>
<mml:mi>s</mml:mi>
<mml:mrow>
<mml:msub>
<mml:mi>&#x2113;</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
</mml:math>
</inline-formula> denote tunable hyperparameters, <inline-formula id="inf23">
<mml:math id="m28">
<mml:mrow>
<mml:msub>
<mml:mi>W</mml:mi>
<mml:mi>s</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> refers to the set of weights connecting the input to the first hidden layer within feature domain <inline-formula id="inf24">
<mml:math id="m29">
<mml:mi>s</mml:mi>
</mml:math>
</inline-formula>, and <inline-formula id="inf25">
<mml:math id="m30">
<mml:mrow>
<mml:msub>
<mml:mi>W</mml:mi>
<mml:mi>D</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
</inline-formula> are the weights of the connections feeding into the output&#x20;layer.</p>
</sec>
<sec id="s3-1-3">
<title>Hyperparameters Optimization</title>
<p>A comprehensive overview of hyperparameters of DeepLORI can be found in the supplements (<xref ref-type="sec" rid="s11">Supplementary Table S2</xref>). We performed Bayesian hyperparameter optimization (<xref ref-type="bibr" rid="B2">Bergstra et&#x20;al., 2013</xref>) to tune DeepLORI on the training data. Each candidate hyperparameter set was evaluated via a 5-fold cross-validation. Hyperparameter optimization was run for 100 trials per fold, a maximum number of 100 epochs per trial, or if the cross-validated prediction performance did not increase within 10 sequential epochs. Prediction performance was measured via Harrell&#x2019;s C-index (<xref ref-type="bibr" rid="B16">Harrell et&#x20;al., 1982</xref>), which is a generalization of the area under the receiver operating characteristic curve (AUC), frequently used for classification models.</p>
</sec>
<sec id="s3-1-4">
<title>Shapley Additive Explanations</title>
<p>One of the main criticisms of neural network based approaches is the difficulty to interpret them. Recently, <xref ref-type="bibr" rid="B27">Lundberg and Lee (2017)</xref> proposed a model agnostic game theoretic framework to address this issue. In brief, the idea behind Shapley Additive Explanations (SHAP) is that the relevance <inline-formula id="inf26">
<mml:math id="m31">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3a6;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> of feature <inline-formula id="inf27">
<mml:math id="m32">
<mml:mi>i</mml:mi>
</mml:math>
</inline-formula> on the model output <inline-formula id="inf28">
<mml:math id="m33">
<mml:mrow>
<mml:mi>f</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> can be regarded as the average weighted difference between outputs from all possible models trained on 1) all subsets <italic>S</italic> of features including feature <inline-formula id="inf29">
<mml:math id="m34">
<mml:mi>i</mml:mi>
</mml:math>
</inline-formula>, against 2) all subsets of features excluding feature <inline-formula id="inf30">
<mml:math id="m35">
<mml:mi>i</mml:mi>
</mml:math>
</inline-formula>:<disp-formula id="equ6">
<mml:math id="m36">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3a6;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mstyle displaystyle="true">
<mml:munder>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mi>S</mml:mi>
<mml:mo>&#x2286;</mml:mo>
<mml:mi>F</mml:mi>
</mml:mrow>
<mml:mo>/</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mo>{</mml:mo>
<mml:mi>i</mml:mi>
<mml:mo>}</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mrow>
</mml:mrow>
</mml:munder>
<mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:mrow>
<mml:mo>&#x7c;</mml:mo>
<mml:mi>S</mml:mi>
<mml:mo>&#x7c;</mml:mo>
</mml:mrow>
<mml:mo>!</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mo>&#x7c;</mml:mo>
<mml:mi>F</mml:mi>
<mml:mo>&#x7c;</mml:mo>
</mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mrow>
<mml:mo>&#x7c;</mml:mo>
<mml:mi>S</mml:mi>
<mml:mo>&#x7c;</mml:mo>
</mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>!</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mo>&#x7c;</mml:mo>
<mml:mi>F</mml:mi>
<mml:mo>&#x7c;</mml:mo>
</mml:mrow>
<mml:mo>!</mml:mo>
</mml:mrow>
</mml:mfrac>
<mml:mrow>
<mml:mo>[</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mrow>
<mml:mi>S</mml:mi>
<mml:mo>&#x222a;</mml:mo>
<mml:mrow>
<mml:mo>{</mml:mo>
<mml:mi>i</mml:mi>
<mml:mo>}</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mrow>
<mml:mi>S</mml:mi>
<mml:mo>&#x222a;</mml:mo>
<mml:mrow>
<mml:mo>{</mml:mo>
<mml:mi>i</mml:mi>
<mml:mo>}</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:msub>
<mml:mi>f</mml:mi>
<mml:mi>S</mml:mi>
</mml:msub>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>x</mml:mi>
<mml:mi>S</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo>]</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:math>
</disp-formula>with <inline-formula id="inf31">
<mml:math id="m37">
<mml:mi>F</mml:mi>
</mml:math>
</inline-formula> as the set of all features. The authors propose several local approximation techniques, which can circumvent the exact combinatorial calculation of <inline-formula id="inf32">
<mml:math id="m38">
<mml:mrow>
<mml:msub>
<mml:mi>&#x3a6;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
</inline-formula> one which is specifically tailored toward neural networks (Deep SHAP). Deep SHAP effectively combines SHAP values calculated for smaller components of a neural network into SHAP values for the entire network. We refer to <xref ref-type="bibr" rid="B27">Lundberg and Lee (2017)</xref> for details. In this work, we used SHAP to understand the impact of individual feature domains, subdomains, and AEDs on the comorbidity risk score that we learned via DeepLORI. SHAP results in a patient-specific score that may be positive [feature <italic>i</italic> increases <italic>f</italic>(<italic>x</italic>)] or negative [feature <italic>i</italic> decreases <italic>f</italic>(<italic>x</italic>)] compared to the average patient. In agreement to Lundberg et&#x20;al., we considered the mean absolute values of the SHAP values per feature to score the overall impact of a variable. Moreover, we investigated the overall mean absolute SHAP values per feature domain and subdomain, respectively. This is possible because SHAP values are additive. That means the sum of two SHAP values can indeed be interpreted as the overall impact of the corresponding features.</p>
<p>In practice, we found Deep SHAP too computationally costly when using our entire original dataset. We thus repeatedly subsampled 5% of our data with replacement (30 times) and recalculated SHAP values. We checked the robustness of the approach via the variance of SHAP values.</p>
</sec>
</sec>
<sec id="s3-2">
<title>Competing Methods</title>
<p>We compared DeepLORI against several competing approaches:<list list-type="simple">
<list-item>
<p>(1) Random survival forests (<xref ref-type="bibr" rid="B21">Ishwaran et&#x20;al., 2008</xref>): In this earlier published approach (<xref ref-type="bibr" rid="B14">Gerlach et&#x20;al., 2017</xref>), we first combined claims data with biomedical knowledge (akin to this article) and then used a window of fixed length (3&#xb0;months) to summarize features via a max-pooling. Features encoding prescriptions and diagnoses within such a time window were concatenated, resulting in an overall number of around 165,000 features per patient. Subsequently, we used maximum relevance minimum redundancy (mRMR) (<xref ref-type="bibr" rid="B10">Ding and Peng, 2005</xref>) to further reduce the number of features to 500 prior to random survival forest (RSF) model training. For RSF model training, we relied on R-package &#x201c;ranger&#x201d; (<xref ref-type="bibr" rid="B56">Wright and Ziegler, 2017</xref>). The number of decision trees was set to 5,000, and the log-rank statistic was used as a split rule for&#x20;nodes.</p>
</list-item>
<list-item>
<p>(2) Stacked denoising autoencoders (SDAs) followed by training an RSF (<xref ref-type="bibr" rid="B30">Miotto et&#x20;al., 2016</xref>): In this approach, initially an SDA was trained to extract features from the medical history of each patient (diagnosis and prescription codes as well as demographic information) in an unsupervised manner. The same SDA architecture as described in Miotto et&#x20;al. was employed. After feature extraction for each of the 6 comorbidities, an RSF was trained.</p>
</list-item>
<list-item>
<p>(3) A Kaplan&#x2013;Meier (KM) estimator as &#x201c;null model.&#x201d; This approach does not use features of any individual. It only estimates the overall risk curve for a given comorbidity from the data and applies the same estimate to each patient. The purpose of this &#x201c;null model&#x201d; was to understand the added value of complex machine learning models.</p>
</list-item>
</list>
</p>
</sec>
<sec id="s3-3">
<title>Evaluation Approach</title>
<p>DeepLORI was compared with competing methods within a 5-fold cross-validation scheme using the exactly same data splits of the original dataset. Hyperparameters were only tuned on the respective training data, resulting in a nested cross-validation scheme for DeepLORI. We used Uno&#x2019;s C-index (<xref ref-type="bibr" rid="B51">Uno et&#x20;al., 2011</xref>) as a performance measure:<disp-formula id="equ7">
<mml:math id="m39">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mi>C</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mi>&#x3c4;</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:msubsup>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:msubsup>
<mml:mrow>
<mml:msub>
<mml:mi>&#x394;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:msup>
<mml:mrow>
<mml:mrow>
<mml:mo>{</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mover accent="true">
<mml:mi>G</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mrow>
<mml:mo>}</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mstyle>
<mml:mi>I</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x3c;</mml:mo>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x3c;</mml:mo>
<mml:mi>&#x3c4;</mml:mi>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mi>I</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>r</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>s</mml:mi>
<mml:mi>k</mml:mi>
</mml:mrow>
<mml:mo stretchy="true">&#x5e;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x3e;</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi>r</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>s</mml:mi>
<mml:mi>k</mml:mi>
</mml:mrow>
<mml:mo stretchy="true">&#x5e;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:msubsup>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:msubsup>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mi>j</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:msubsup>
<mml:mrow>
<mml:msub>
<mml:mi>&#x394;</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:msup>
<mml:mrow>
<mml:mrow>
<mml:mo>{</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mover accent="true">
<mml:mi>G</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
</mml:mrow>
<mml:mo>}</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mstyle>
<mml:mi>I</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x3c;</mml:mo>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mi>j</mml:mi>
</mml:msub>
<mml:mo>,</mml:mo>
<mml:msub>
<mml:mi>X</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
<mml:mo>&#x3c;</mml:mo>
<mml:mi>&#x3c4;</mml:mi>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</disp-formula>
</p>
<p>Uno&#x2019;s C-index is a consistent estimator of the concordance index for a population that is independent of censoring. It satisfies this requirement for censored populations using two &#x201c;tricks,&#x201d; first by applying an &#x201c;inverse probability weighting&#x201d; schema using the censoring distribution estimated with <inline-formula id="inf33">
<mml:math id="m40">
<mml:mrow>
<mml:mrow>
<mml:mover accent="true">
<mml:mi>G</mml:mi>
<mml:mo>&#x5e;</mml:mo>
</mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mo>&#x22c5;</mml:mo>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> (e.g., the Kaplan&#x2013;Meier estimator), second by evading instable tail parts for times <inline-formula id="inf34">
<mml:math id="m41">
<mml:mrow>
<mml:mo>&#x2265;</mml:mo>
<mml:mi>&#x3c4;</mml:mi>
</mml:mrow>
</mml:math>
</inline-formula> of the estimated survival function with a prespecified time point <inline-formula id="inf35">
<mml:math id="m42">
<mml:mi>&#x3c4;</mml:mi>
</mml:math>
</inline-formula> as constraint. We refer to <xref ref-type="bibr" rid="B51">Uno et&#x20;al. (2011)</xref> for further details.</p>
<p>In addition, we evaluated DeepLORI on our external validation data. This validation was done separately in two different ways:<list list-type="simple">
<list-item>
<p>(1) Follow-up of existing patients: We selected patients who had already been in our original dataset, but for whom a right censoring was observed.</p>
</list-item>
<list-item>
<p>(2) New patients: We evaluated DeepLORI on patients who had no records in the original dataset.</p>
</list-item>
</list>
</p>
<p>In both cases, we recorded Uno&#x2019;s C-index over the entire time series and as a function of time (named <inline-formula id="inf36">
<mml:math id="m43">
<mml:mrow>
<mml:mi>A</mml:mi>
<mml:mi>U</mml:mi>
<mml:mi>C</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula> in the following) to measure the prediction performance.</p>
</sec>
</sec>
<sec sec-type="results" id="s4">
<title>Results</title>
<sec id="s4-1">
<title>DeepLORI Outperforms Competing Methods</title>
<p>Despite high censoring rates, all 6 comorbidities could be predicted rather accurately by DeepLORI, and the 5-fold cross-validated performance of Uno&#x2019;s C-index ranged from 71% for overweight and obesity to 77% for stroke and ischemic attacks (<xref ref-type="fig" rid="F3">Figure&#x20;3</xref>; <xref ref-type="sec" rid="s11">Supplementary Table S3</xref>). At the same time, the Kaplan&#x2013;Meier estimator (i.e.,&#x20;the &#x201c;null&#x201d;-model without any features) was consistently at the chance level (50% Uno&#x2019;s C-index), indicating that all of our tested machine learning models (DeepPatient, DeepLORI, and MRMR &#x2b; RSF) extracted relevant predictive signal from the data. At the same time, DeepLORI showed significantly higher C-indices than all competing methods.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Five-fold (nested) cross-validation test sets performance benchmark of Deep LORI (green) vs. competing methods; mRMR: minimum redundancy maximum relevance feature selection; SDAE: stacked denoising autoencoder; RSF: random survival forest; KM: Kaplan&#x2013;Meier estimator.</p>
</caption>
<graphic xlink:href="frai-04-610197-g003.tif"/>
</fig>
</sec>
<sec id="s4-2">
<title>DeepLORI Shows Stable Prediction Performance on External Validation Data</title>
<p>Evaluation of DeepLORI on the external validation data showed roughly comparable C-indices to those observed on the original data when focusing on the follow-up of the &#x223c;15,000 patients, who had medical history in the original data (<xref ref-type="fig" rid="F4">Figure&#x20;4</xref>). This highlights that DeepLORI, despite high censoring rates in the original data, was not over-fitted. C-indices for new/so far unseen patients (<italic>n</italic>&#x20;&#x3d; &#x223c;97,000) in the external validation data were around 6% lower (<xref ref-type="sec" rid="s11">Supplementary Table&#x20;S3</xref>).</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Prediction performance of Deep LORI on external validation data. Green: time-split validation, that is, follow-up of patients included in training data. Blue: prediction performance on new patient data. Red: 5-fold cross-validated prediction performance on original data for comparison purposes.</p>
</caption>
<graphic xlink:href="frai-04-610197-g004.tif"/>
</fig>
<p>When investigating the <inline-formula id="inf37">
<mml:math id="m44">
<mml:mrow>
<mml:mi>A</mml:mi>
<mml:mi>U</mml:mi>
<mml:mi>C</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>t</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>, we found a rather stable prediction performance for all comorbidities over time (<xref ref-type="fig" rid="F5">Figure&#x20;5</xref>). Remarkably, this held true for a time interval of up to 6&#xb0;years after initial diagnosis of epilepsy, and it was true for the follow-up of existing patients as well as for new patients, again highlighting the fact that DeepLORI generalizes rather&#x20;well.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Time-dependent prediction performance (AUC(t)) of DeepLORI on external validation&#x20;data.</p>
</caption>
<graphic xlink:href="frai-04-610197-g005.tif"/>
</fig>
</sec>
<sec id="s4-3">
<title>DeepLORI Models Are Explainable</title>
<p>We next investigated the relevance of feature domains via SHAP in DeepLORI models trained on the entire original dataset. This analysis highlighted for most comorbidities the relevance of features derived via augmentation of the original data with additional information (<xref ref-type="fig" rid="F6">Figure&#x20;6</xref>): For example, in the model, predicting anxiety augmented features made up around 55% of the total feature importance, and for migraine, we found 43%. Notably, among augmented features, the &#x201c;medical risk&#x201d; subdomain, covering various unspecific comorbidity indices derived from ICD diagnosis codes (<xref ref-type="bibr" rid="B6">Charlson et&#x20;al., 1987</xref>; <xref ref-type="bibr" rid="B41">Romano et&#x20;al., 1993</xref>; <xref ref-type="bibr" rid="B26">Lee et&#x20;al., 1999</xref>; <xref ref-type="bibr" rid="B43">Schneeweiss et&#x20;al., 2003</xref>; <xref ref-type="bibr" rid="B3">Boersma et&#x20;al., 2005</xref>; <xref ref-type="bibr" rid="B37">Quan et&#x20;al., 2005</xref>; <xref ref-type="bibr" rid="B45">Sessler et&#x20;al., 2010</xref>; <xref ref-type="bibr" rid="B46">Sigakis et&#x20;al., 2013</xref>) using the R-package &#x201c;medicalrisk&#x201d; (<xref ref-type="bibr" rid="B29">McCormick and Joseph, 2020</xref>) in the medical history of epilepsy patients, had a significant impact (<xref ref-type="fig" rid="F7">Figure&#x20;7</xref>), suggesting that the risk of developing any of our six comorbidities increases with a generally worse medical condition upfront. Importantly, none of the comorbidity indices are specific to any of the six comorbidities focused by DeepLORI.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>Relative impact of original vs augmented features in DeepLORI models for 6 different comorbidities</p>
</caption>
<graphic xlink:href="frai-04-610197-g006.tif"/>
</fig>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption>
<p>SHAP values by feature subdomain. Subdomains with a cumulative relative importance <inline-formula id="inf38">
<mml:math id="m45">
<mml:mrow>
<mml:mo>&#x2264;</mml:mo>
<mml:mn>5</mml:mn>
<mml:mtext>%</mml:mtext>
</mml:mrow>
</mml:math>
</inline-formula> are not&#x20;shown.</p>
</caption>
<graphic xlink:href="frai-04-610197-g007.tif"/>
</fig>
<p>In the following, we discuss one of the six DeepLORI models in more detail, namely, the one for migraine (<xref ref-type="fig" rid="F8">Figure&#x20;8</xref>). (Figures related to DeepLORI models for the other five comorbidities can be found in the <xref ref-type="sec" rid="s11">Supplementary Material</xref> (<xref ref-type="sec" rid="s11">Supplementary Figures S1&#x2013;S6</xref>)). According to SHAP analysis, the most relevant features in the DeepLORI model for migraine relate to the prior existence of headaches and the use of drugs for the nervous system, which are typically used to treat headaches. In addition, many drugs used for treating headaches are known to affect the liver (<xref ref-type="bibr" rid="B28">Mathew and Klein, 2019</xref>; <xref ref-type="bibr" rid="B52">Valade, 2019</xref>). It is known that females are more affected by migraine than males, and that migraine is age-dependent (<xref ref-type="bibr" rid="B54">Victor et&#x20;al., 2010</xref>). The antiepileptic drug (AED) topiramate, known to be well-tolerated by this group of patients (<xref ref-type="bibr" rid="B48">Spritzer et&#x20;al., 2016</xref>; <xref ref-type="bibr" rid="B47">Silberstein, 2017</xref>), ranks among the top 15 most relevant features. <xref ref-type="fig" rid="F9">Figure&#x20;9</xref> shows the marginal dependency of DeepLORI model predictions on AED prescription frequency, suggesting that patients treated with topiramate are slightly more likely to be diagnosed with migraine later than those without such treatment in the past. In fact, topiramate is often used as a preventive treatment for migraine (<xref ref-type="bibr" rid="B48">Spritzer et&#x20;al., 2016</xref>), suggesting that patients treated with this AED are often considered at risk of developing migraine by their treating physician. Indeed, many of these patients eventually receive this diagnosis.</p>
<fig id="F8" position="float">
<label>FIGURE 8</label>
<caption>
<p>SHAP values of top 15 most relevant features in the DeepLORI model for migraine, rank by mean absolute values. <italic>x</italic>-axis: SHAP values, higher values &#x3d; higher importance. <italic>y</italic>-axis: features ranked by importance, annotated with their domain and subdomain membership (domain &#x3e; subdomain &#x3e; feature).</p>
</caption>
<graphic xlink:href="frai-04-610197-g008.tif"/>
</fig>
<fig id="F9" position="float">
<label>FIGURE 9</label>
<caption>
<p>Plot shows the marginal dependency of the frequency of topiramate prescription on the predicted risk on later migraine diagnosis. One dot represents one patient; <italic>x</italic>-axis: prescription frequency (0% &#x3d; never observed, 100% &#x3d; observed every month of a patient&#x2018;s medical history); <italic>y</italic>-axis: change in SHAP value (&#x3d;change in individual hazard rate). Marginal dependency plots for each comorbidity for the top 5 features can be found in the <xref ref-type="sec" rid="s11">Supplemental Material</xref> (<xref ref-type="sec" rid="s11">Supplementary Figures S7&#x2013;S12</xref>).</p>
</caption>
<graphic xlink:href="frai-04-610197-g009.tif"/>
</fig>
<p>Another interesting finding from the SHAP analysis of our model is the influence of disorders of the lipoid metabolism on migraine risk. Associations between lipid levels and migraine have been reported in <xref ref-type="bibr" rid="B39">Rist et&#x20;al. (2011)</xref> and <xref ref-type="bibr" rid="B33">Onderwater et&#x20;al. (2019)</xref>. Moreover, the metabolic syndrome and migraine have been associated with each other (<xref ref-type="bibr" rid="B42">Sachdev and Marmura, 2012</xref>). It is important to highlight at this point that SHAP analysis does not provide a causal explanation, though.</p>
<p>To further exemplify the possibility of interpreting our DeepLORI models on the level of individual patients, we depict in <xref ref-type="fig" rid="F10">Figure&#x20;10</xref> SHAP values for two randomly selected patients with high and low risk for developing stroke or ischemic attacks, respectively. As expected, the low-risk patient is young and has no diagnosis of hypertension or disorder of the metabolic system. In contrast, the high-risk patient is an older person with hypertension who lives in Texas. In fact, significant regional differences in the risk for strokes have been reported throughout the United&#x20;States (<xref ref-type="bibr" rid="B19">Howard et&#x20;al., 2007</xref>), and Eastern Texas belongs to the so-called &#x201c;Stroke Belt&#x201d; (<xref ref-type="bibr" rid="B22">Karp David et&#x20;al., 2016</xref>).</p>
<fig id="F10" position="float">
<label>FIGURE 10</label>
<caption>
<p>Examples of SHAP explanations for a patient predicted at low risk for stroke and ischemic attacks <bold>(left)</bold> and a high-risk patient <bold>(right)</bold>. Red (green) bars indicate higher <bold>(lower)</bold> risk than the average patient: The hazard ratio<xref ref-type="fn" rid="fn2">
<sup>2</sup>
</xref> of the low-risk patient <bold>(left)</bold> is around 56% of that of an average patient <inline-formula id="inf39">
<mml:math id="m46">
<mml:mrow>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mrow>
<mml:mrow>
<mml:mi>exp</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>17.29</mml:mn>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo>/</mml:mo>
<mml:mrow>
<mml:mi>exp</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>16.71</mml:mn>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mrow>
<mml:mtext>&#xa0;</mml:mtext>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>0.56</mml:mn>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>. The hazard ratio of the high-risk patient <bold>(right)</bold> is around 2.94&#x20;times that of an average patient <inline-formula id="inf40">
<mml:math id="m47">
<mml:mrow>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mtext>&#xa0;</mml:mtext>
<mml:mrow>
<mml:mrow>
<mml:mi>exp</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>15.63</mml:mn>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo>/</mml:mo>
<mml:mrow>
<mml:mi>exp</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mn>16.71</mml:mn>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>2.94</mml:mn>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
</inline-formula>.</p>
</caption>
<graphic xlink:href="frai-04-610197-g010.tif"/>
</fig>
</sec>
</sec>
<sec id="s5">
<title>Discussion and Conclusion</title>
<p>Precision medicine has the vision to bring the right treatment to the right patients. Precision medicine is strongly dependent on machine learning. At present, precision medicine is only an emerging reality. Several reasons can be identified (<xref ref-type="bibr" rid="B13">Fr&#xf6;hlich et&#x20;al., 2018</xref>; <xref ref-type="bibr" rid="B31">Miotto et&#x20;al., 2018</xref>; <xref ref-type="bibr" rid="B57">Xiao et&#x20;al., 2018</xref>; <xref ref-type="bibr" rid="B25">Kwak and Hui, 2020</xref>): 1) lack of the right data in sufficient quantity, 2) insufficient validation, and 3) difficulties in interpreting complex ML models, which is by itself a prerequisite for generating the necessary confidence in using such models. Realization of precision medicine will only be possible, if all these aspects are addressed jointly. In this context, it is essential that ML models can be used in a cost-effective and practical manner. Hence, clinical routine data are of extreme relevance and are gaining more and more attention (<xref ref-type="bibr" rid="B55">Weiss et&#x20;al., 2012</xref>; <xref ref-type="bibr" rid="B36">Peissig et&#x20;al., 2014</xref>; <xref ref-type="bibr" rid="B7">Choi et&#x20;al., 2016</xref>; <xref ref-type="bibr" rid="B30">Miotto et&#x20;al., 2016</xref>; <xref ref-type="bibr" rid="B38">Rajkomar et&#x20;al., 2018</xref>; <xref ref-type="bibr" rid="B17">Harutyunyan et&#x20;al., 2019</xref>). Administrative claims data constitute an important source of such clinical routine data. They principally exist in large quantities and allow for obtaining insights into the longitudinal medical history of individual patients under real-world conditions. However, these data have not been collected for research purposes. First of all, coding of diagnoses into ICD codes is not unique and mostly done for maximizing economic reasons, rather than for providing a precise medical description. Different ICD codes can be used for similar diagnoses, and the relationship among different medical conditions is consequently not always uniquely resolvable from their distances in the ICD ontology. Second, it should be noted that ICD only reflects the medical symptom level, which should not be confused with the biological relationship among disorders. Third, the time of diagnosis encoding might not correspond to the actual appearance of the medical condition. Fourth, it is unclear whether patients take the prescribed medication. Finally, the nature of irregular time series data, different for each patient, imposes specific challenges for data analysis.</p>
<p>In this work, we tried to address these challenges by a) mapping ICD codes to PheWAS codes that are at higher granularity, b) augmenting the original data with further information from biological databases, and c) proposing specific multimodal neural network architecture (DeepLORI). We demonstrated that DeepLORI can predict six common comorbidities of epilepsy patients with higher C-index than several competing methods. We performed a rigorous cross-validation plus an external validation to assess our model, demonstrating that DeepLORI allows for reliable predictions of comorbidity risks up to six years in advance. We showed that with the help of SHAP and our data augmentation approach, it is possible to make DeepLORI-based predictions explainable, even on the level of individual patients. From our perspective, this is of great importance for generating confidence in ML-based solutions in medicine.</p>
<p>From a medical perspective, we see the value of our work in the potential for much earlier identification of epilepsy patients at risk of developing different comorbidities. For example, a patient at high risk of developing diabetes type 2 should consider losing weight and regularly check insulin levels. A patient at high risk of developing psychiatric disorders might consider early consultation with a psychiatrist. Hence, risk models could be a way to eventually move toward preventive medicine.</p>
<p>Further applications of our work could lie in addressing the high subject-to-subject variability in epilepsy: Based on the comorbidity risk profile learned by DeepLORI, one might be able to identify subgroups of patients with more homogenous disease progression, potentially opening up opportunities for developing more personalized therapies in the future.</p>
</sec>
</body>
<back>
<sec id="s6">
<title>Data Availability Statement</title>
<p>The data analyzed in this study are subject to the following licenses/restrictions: We used administrative health claims data provided by IBM Truven Health Analytics. Data access has to be requested from IBM. The DeepLORI framework is now available at <ext-link ext-link-type="uri" xlink:href="https://gitlab.scai.fraunhofer.de/thomas.linden/deeplori">https://gitlab.scai.fraunhofer.de/thomas.linden/deeplori</ext-link>. The readme contains instructions for a setup and demo. The demo simulates patients who are accessible from the described folder. Requests to access these datasets should be directed to <ext-link ext-link-type="uri" xlink:href="https://www.ibm.com/products/marketscan-research-databases">https://www.ibm.com/products/marketscan-research-databases</ext-link>, <ext-link ext-link-type="uri" xlink:href="https://www.ibm.com/watson-health/about/truven-health-analytics">https://www.ibm.com/watson-health/about/truven-health-analytics</ext-link>.</p>
</sec>
<sec id="s7">
<title>Ethics Statement</title>
<p>The studies involving human participants were reviewed and approved by UCB internal Ethics Office. Written informed consent for participation was not required for this study in accordance with the national legislation and the institutional requirements.</p>
</sec>
<sec id="s8">
<title>Author Contributions</title>
<p>Designed and supervised the project: HF; extracted the data: CL, VK, and KH; analyzed the data: TL and JJ; performed experiments: TL; interpreted the data and results: TL and HF; and drafted the manuscript: TL and HF. All authors have read the manuscript and agreed to its content.</p>
</sec>
<sec id="s9">
<title>Funding</title>
<p>This work was funded Fraunhofer internally.</p>
</sec>
<sec sec-type="COI-statement" id="s10">
<title>Conflict of Interest</title>
<p>The authors TL, JJ, KH, and HF were employed by the company UCB Biosciences GmbH, and CL and VK were employed by the company UCB Ltd. All authors have received salaries from UCB Pharma S.A. during the runtime of this project. UCB had no influence on the scientific content of this work. Most of the presented work has been done, while the first and last authors were affiliated with UCB Biosciences GmbH, Monheim.</p>
</sec>
<ack>
<p>We like to thank Linda Kalilani and Babak Boroorjerdi for helpful discussions and support of the entire project.</p>
</ack>
<sec id="s11">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/frai.2021.610197/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/frai.2021.610197/full&#x23;supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="DataSheet1.docx" id="SM1" mimetype="application/docx" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<sec id="s12">
<title>Abbreviations</title>
<p>AED, antiepileptic drug; SDA, stacked denoising autoencoder; mRMR, minimum redundancy maximum relevance; RSF, random survival forest.</p>
</sec>
<fn-group>
<fn id="fn1">
<label>1</label>
<p>
<ext-link ext-link-type="uri" xlink:href="http://www.tdrdata.com/ipd/ipd">http://www.tdrdata.com/ipd/ipd</ext-link> ICD10ToICD9List</p>
</fn>
<fn id="fn2">
<label>2</label>
<p>Hazard ratios computed similar to Cox proportional hazard&#x0027;s model (<xref ref-type="bibr" rid="B8">Cox, 1972</xref>).</p>
</fn>
</fn-group>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>An</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Malhotra</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Dilley</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Han-Burgess</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Valdez</surname>
<given-names>J.&#x20;N.</given-names>
</name>
<name>
<surname>Robertson</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Predicting Drug-Resistant Epilepsy - A Machine Learning Approach Based on Administrative Claims Data</article-title>. <source>Epilepsy Behav.</source> <volume>89</volume>, <fpage>118</fpage>&#x2013;<lpage>125</lpage>. <pub-id pub-id-type="doi">10.1016/j.yebeh.2018.10.013</pub-id> </citation>
</ref>
<ref id="B2">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Bergstra</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Yamins</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Cox</surname>
<given-names>D. D.</given-names>
</name>
</person-group> (<year>2013</year>). &#x201c;<article-title>Making a Science of Model Search: Hyperparameter Optimization in Hundreds of Dimensions for Vision Architectures</article-title>,&#x201d; in <conf-name>Proceedings of the 30th International Conference on Machine Learning -Volume 28</conf-name>, <conf-loc>Atlanta, GA</conf-loc>, <conf-date>June, 2013</conf-date>. <publisher-name>JMLR.org (ICML&#x2019;13)</publisher-name>, <fpage>I115</fpage>&#x2013;<lpage>I123</lpage>. </citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Boersma</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Kertai</surname>
<given-names>M. D.</given-names>
</name>
<name>
<surname>Schouten</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Bax</surname>
<given-names>J.&#x20;J.</given-names>
</name>
<name>
<surname>Noordzij</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Steyerberg</surname>
<given-names>E. W.</given-names>
</name>
<etal/>
</person-group> (<year>2005</year>). <article-title>Perioperative Cardiovascular Mortality in Noncardiac Surgery: Validation of the Lee Cardiac Risk Index</article-title>. <source>Am. J.&#x20;Med.</source> <volume>118</volume> (<issue>10</issue>), <fpage>1134</fpage>&#x2013;<lpage>1141</lpage>. <pub-id pub-id-type="doi">10.1016/j.amjmed.2005.01.064</pub-id> </citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Breslow</surname>
<given-names>N. E.</given-names>
</name>
</person-group> (<year>1972</year>). <article-title>&#x2018;Discussion on Professor Cox&#x2019;s Paper&#x2019;</article-title>. <source>J.&#x20;R. Stat. Soc. Ser. B (Methodological)</source>, <volume>34</volume> (<issue>2</issue>), pp. <fpage>202</fpage>&#x2013;<lpage>220</lpage>. <pub-id pub-id-type="doi">10.1111/j.2517-6161.1972.tb00900.x</pub-id> </citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Carroll</surname>
<given-names>R. J.</given-names>
</name>
<name>
<surname>Bastarache</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Denny</surname>
<given-names>J.&#x20;C.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>R PheWAS: Data Analysis and Plotting Tools for Phenome-wide Association Studies in the R Environment</article-title>. <source>Bioinformatics</source> <volume>30</volume> (<issue>16</issue>), <fpage>2375</fpage>&#x2013;<lpage>2376</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btu197</pub-id> </citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Charlson</surname>
<given-names>M. E.</given-names>
</name>
<name>
<surname>Pompei</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Ales</surname>
<given-names>K. L.</given-names>
</name>
<name>
<surname>MacKenzie</surname>
<given-names>C. R.</given-names>
</name>
</person-group> (<year>1987</year>). <article-title>A New Method of Classifying Prognostic Comorbidity in Longitudinal Studies: Development and Validation</article-title>. <source>J.&#x20;Chronic Dis.</source> <volume>40</volume> (<issue>5</issue>), <fpage>373</fpage>&#x2013;<lpage>383</lpage>. <pub-id pub-id-type="doi">10.1016/0021-9681(87)90171-8</pub-id> </citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Choi</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Bahadori</surname>
<given-names>M. T.</given-names>
</name>
<name>
<surname>Schuetz</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Stewart</surname>
<given-names>W. F.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Doctor AI: Predicting Clinical Events via Recurrent Neural Networks</article-title>. <source>arXiv:1511.05942 [cs]</source>. <comment>Available at: <ext-link ext-link-type="uri" xlink:href="http://arxiv.org/abs/1511.05942">http://arxiv.org/abs/1511.05942</ext-link>
</comment>. </citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Cox</surname>
<given-names>D. R.</given-names>
</name>
</person-group> (<year>1972</year>). <article-title>Regression Models and Life-Tables</article-title>. <source>J.&#x20;R. Stat. Soc. Ser. B (Methodological)</source> <volume>34</volume> (<issue>2</issue>), <fpage>187</fpage>&#x2013;<lpage>202</lpage>. <pub-id pub-id-type="doi">10.1111/j.2517-6161.1972.tb00899.x</pub-id> </citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Desai</surname>
<given-names>R. J.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>S. V.</given-names>
</name>
<name>
<surname>Vaduganathan</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Evers</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Schneeweiss</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Comparison of Machine Learning Methods with Traditional Models for Use of Administrative Claims with Electronic Medical Records to Predict Heart Failure Outcomes</article-title>. <source>JAMA Netw. Open</source> <volume>3</volume> (<issue>1</issue>), <fpage>e1918962</fpage>. <pub-id pub-id-type="doi">10.1001/jamanetworkopen.2019.18962</pub-id> </citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ding</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Peng</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Minimum Redundancy Feature Selection from Microarray Gene Expression Data</article-title>. <source>J.&#x20;Bioinform. Comput. Biol.</source> <volume>03</volume> (<issue>2</issue>), <fpage>185</fpage>&#x2013;<lpage>205</lpage>. <pub-id pub-id-type="doi">10.1142/s0219720005001004</pub-id> </citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dworzynski</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Aasbrenn</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Rostgaard</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Melbye</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Gerds</surname>
<given-names>T. A.</given-names>
</name>
<name>
<surname>Hjalgrim</surname>
<given-names>H.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Nationwide Prediction of Type 2 Diabetes Comorbidities</article-title>. <source>Sci. Rep.</source> <volume>10</volume> (<issue>1</issue>), <fpage>1776</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-020-58601-7</pub-id> </citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Engels</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Reber</surname>
<given-names>K. C.</given-names>
</name>
<name>
<surname>Lindlbauer</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Rapp</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>B&#xfc;chele</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Klenk</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Osteoporotic Hip Fracture Prediction from Risk Factors Available in Administrative Claims Data - A Machine Learning Approach</article-title>. <source>PLOS ONE</source> <volume>15</volume> (<issue>5</issue>), <fpage>e0232969</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0232969</pub-id> </citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fr&#xf6;hlich</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Balling</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Beerenwinkel</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Kohlbacher</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Kumar</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Lengauer</surname>
<given-names>T.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>From Hype to Reality: Data Science Enabling Personalized Medicine</article-title>. <source>BMC Med.</source> <volume>16</volume> (<issue>1</issue>), <fpage>150</fpage>. <pub-id pub-id-type="doi">10.1186/s12916-018-1122-7</pub-id> </citation>
</ref>
<ref id="B14">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Gerlach</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Lu</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Fr&#xf6;hlich</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2017</year>). &#x201c;<article-title>Predicting Comorbidities of Epilepsy Patients Using Big Data from Electronic Health Records Combined with Biomedical Knowledge</article-title>,&#x201d; in <conf-name>Proceedings of the GCB German Conference on Bioinformatics 2017</conf-name>, <conf-date>September 18&#x2013;21, 2017</conf-date>, <conf-loc>T&#xfc;bingen, Germany</conf-loc>. <publisher-name>PeerJ Inc</publisher-name>. </citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Glauser</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Santel</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>DelBello</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Faist</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Toon</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Clark</surname>
<given-names>P.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Identifying Epilepsy Psychiatric Comorbidities with Machine Learning</article-title>. <source>Acta Neurol. Scand.</source> <volume>141</volume> (<issue>5</issue>), <fpage>388</fpage>&#x2013;<lpage>396</lpage>. <pub-id pub-id-type="doi">10.1111/ane.13216</pub-id> </citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Harrell</surname>
<given-names>F. E.</given-names>
</name>
<name>
<surname>Califf</surname>
<given-names>R. M.</given-names>
</name>
<name>
<surname>Pryor</surname>
<given-names>D. B.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>K. L.</given-names>
</name>
<name>
<surname>Rosati</surname>
<given-names>R. A.</given-names>
</name>
</person-group> (<year>1982</year>). <article-title>Evaluating the Yield of Medical Tests</article-title>. <source>JAMA</source> <volume>247</volume> (<issue>18</issue>), <fpage>2543</fpage>&#x2013;<lpage>2546</lpage>. <pub-id pub-id-type="doi">10.1001/jama.247.18.2543</pub-id> </citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Harutyunyan</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Khachatrian</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Kale</surname>
<given-names>D. C.</given-names>
</name>
<name>
<surname>Ver Steeg</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Galstyan</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Multitask Learning and Benchmarking with Clinical Time Series Data</article-title>. <source>Sci. Data</source> <volume>6</volume> (<issue>1</issue>), <fpage>96</fpage>. <pub-id pub-id-type="doi">10.1038/s41597-019-0103-9</pub-id> </citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hoerl</surname>
<given-names>A. E.</given-names>
</name>
<name>
<surname>Kennard</surname>
<given-names>R. W.</given-names>
</name>
</person-group> (<year>1970</year>). <article-title>Ridge Regression: Biased Estimation for Nonorthogonal Problems</article-title>. <source>Technometrics</source> <volume>12</volume> (<issue>1</issue>), <fpage>55</fpage>&#x2013;<lpage>67</lpage>. <pub-id pub-id-type="doi">10.1080/00401706.1970.10488634</pub-id> </citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Howard</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Labarthe</surname>
<given-names>D. R.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Yoon</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Howard</surname>
<given-names>V. J.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>Regional Differences in African Americans&#x27; High Risk for Stroke: The Remarkable Burden of Stroke for Southern African Americans</article-title>. <source>Ann. Epidemiol.</source> <volume>17</volume> (<issue>9</issue>), <fpage>689</fpage>&#x2013;<lpage>696</lpage>. <pub-id pub-id-type="doi">10.1016/j.annepidem.2007.03.019</pub-id> </citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ioffe</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Szegedy</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Batch Normalization: Accelerating Deep Network Training by Reducing Internal Covariate Shift</article-title>. <source>arXiv:1502.03167 [cs]</source>. <comment>Available at: <ext-link ext-link-type="uri" xlink:href="http://arxiv.org/abs/1502.03167">http://arxiv.org/abs/1502.03167</ext-link>
</comment> (<comment>Accessed April 17, 2018</comment>). </citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ishwaran</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Kogalur</surname>
<given-names>U. B.</given-names>
</name>
<name>
<surname>Blackstone</surname>
<given-names>E. H.</given-names>
</name>
<name>
<surname>Lauer</surname>
<given-names>M. S.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>Random Survival Forests</article-title>. <source>Ann. Appl. Stat.</source> <volume>2</volume>, <fpage>841</fpage>&#x2013;<lpage>860</lpage>. <pub-id pub-id-type="doi">10.1214/08-AOAS169</pub-id> </citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Karp</surname>
<given-names>D. N.</given-names>
</name>
<name>
<surname>Wolff</surname>
<given-names>C. S.</given-names>
</name>
<name>
<surname>Wiebe</surname>
<given-names>D. J.</given-names>
</name>
<name>
<surname>Branas</surname>
<given-names>C. C.</given-names>
</name>
<name>
<surname>Carr</surname>
<given-names>B. G.</given-names>
</name>
<name>
<surname>Mullen</surname>
<given-names>M. T.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Reassessing the Stroke Belt</article-title>. <source>Stroke</source> <volume>47</volume> (<issue>7</issue>), <fpage>1939</fpage>&#x2013;<lpage>1942</lpage>. <pub-id pub-id-type="doi">10.1161/STROKEAHA.116.012997</pub-id> </citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Katzman</surname>
<given-names>J.&#x20;L.</given-names>
</name>
<name>
<surname>Shaham</surname>
<given-names>U.</given-names>
</name>
<name>
<surname>Cloninger</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Bates</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Kluger</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>DeepSurv: Personalized Treatment Recommender System Using A Cox Proportional Hazards Deep Neural Network</article-title>. <source>BMC Med. Res. Methodol.</source> <volume>18</volume> (<issue>1</issue>). <pub-id pub-id-type="doi">10.1186/s12874-018-0482-1</pub-id> </citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Keezer</surname>
<given-names>M. R.</given-names>
</name>
<name>
<surname>Sisodiya</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Sander</surname>
<given-names>J.&#x20;W.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Comorbidities of Epilepsy: Current Concepts and Future Perspectives</article-title>. <source>Lancet Neurol.</source> <volume>15</volume> (<issue>1</issue>), <fpage>106</fpage>&#x2013;<lpage>115</lpage>. <pub-id pub-id-type="doi">10.1016/S1474-4422(15)00225-2</pub-id> </citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kwak</surname>
<given-names>G. H.</given-names>
</name>
<name>
<surname>Hui</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>DeepHealth: Review and Challenges of Artificial Intelligence in Health Informatics</article-title>. <source>arXiv:1909.00384 [cs, eess, stat]</source>. <comment>Available at: <ext-link ext-link-type="uri" xlink:href="http://arxiv.org/abs/1909.00384">http://arxiv.org/abs/1909.00384</ext-link>
</comment> (<comment>Accessed August 18, 2020</comment>). </citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lee</surname>
<given-names>T. H.</given-names>
</name>
<name>
<surname>Marcantonio</surname>
<given-names>E. R.</given-names>
</name>
<name>
<surname>Mangione</surname>
<given-names>C. M.</given-names>
</name>
<name>
<surname>Thomas</surname>
<given-names>E. J.</given-names>
</name>
<name>
<surname>Polanczyk</surname>
<given-names>C. A.</given-names>
</name>
<name>
<surname>Cook</surname>
<given-names>E. F.</given-names>
</name>
<etal/>
</person-group> (<year>1999</year>). <article-title>Derivation and Prospective Validation of a Simple Index for Prediction of Cardiac Risk of Major Noncardiac Surgery</article-title>. <source>Circulation</source> <volume>100</volume> (<issue>10</issue>), <fpage>1043</fpage>&#x2013;<lpage>1049</lpage>. <pub-id pub-id-type="doi">10.1161/01.cir.100.10.1043</pub-id> </citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lundberg</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>S.-I.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>A Unified Approach to Interpreting Model Predictions</article-title>. <source>arXiv:1705.07874 [cs, stat]</source>. <comment>Available at: <ext-link ext-link-type="uri" xlink:href="http://arxiv.org/abs/1705.07874">http://arxiv.org/abs/1705.07874</ext-link>
</comment> (<comment>Accessed July 30, 2019</comment>). </citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mathew</surname>
<given-names>P. G.</given-names>
</name>
<name>
<surname>Klein</surname>
<given-names>B. C.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Getting to the Heart of the Matter: Migraine, Triptans, DHE, Ditans, CGRP Antibodies, First/Second&#x2010;Generation Gepants, and Cardiovascular Risk</article-title>. <source>Headache: J.&#x20;Head Face Pain</source> <volume>59</volume>, <fpage>1421</fpage>&#x2013;<lpage>1426</lpage>. <pub-id pub-id-type="doi">10.1111/head.13601</pub-id> </citation>
</ref>
<ref id="B29">
<citation citation-type="web">
<person-group person-group-type="author">
<name>
<surname>McCormick</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Joseph</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Medicalrisk: Medical Risk and Comorbidity Tools for ICD-9-CM Data</article-title>. <comment>Available at: <ext-link ext-link-type="uri" xlink:href="https://CRAN.R-project.org/package=medicalrisk">https://CRAN.R-project.org/package&#x3d;medicalrisk</ext-link>
</comment> (<comment>Accessed August 13, 2020</comment>). </citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Miotto</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Kidd</surname>
<given-names>B. A.</given-names>
</name>
<name>
<surname>Dudley</surname>
<given-names>J.&#x20;T.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Deep Patient: An Unsupervised Representation to Predict the Future of Patients from the Electronic Health Records</article-title>. <source>Sci. Rep.</source> <volume>6</volume>, <fpage>26094</fpage>. <pub-id pub-id-type="doi">10.1038/srep26094</pub-id> </citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Miotto</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Dudley</surname>
<given-names>J.&#x20;T.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Deep Learning for Healthcare: Review, Opportunities and Challenges</article-title>. <source>Brief. Bioinform.</source> <volume>19</volume> (<issue>6</issue>), <fpage>1236</fpage>&#x2013;<lpage>1246</lpage>. <pub-id pub-id-type="doi">10.1093/bib/bbx044</pub-id> </citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Noh</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Yoo</surname>
<given-names>K. D.</given-names>
</name>
<name>
<surname>Bae</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>J.&#x20;S.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Cho</surname>
<given-names>J.-H.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Prediction of the Mortality Risk in Peritoneal Dialysis Patients Using Machine Learning Models: A Nation-wide Prospective Cohort in Korea</article-title>. <source>Sci. Rep.</source> <volume>10</volume> (<issue>1</issue>), <fpage>7470</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-020-64184-0</pub-id> </citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Onderwater</surname>
<given-names>G. L. J.</given-names>
</name>
<name>
<surname>Ligthart</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Bot</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Demirkan</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Fu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>van der Kallen</surname>
<given-names>C. J.&#x20;H.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Large-scale Plasma Metabolome Analysis Reveals Alterations in HDL Metabolism in Migraine</article-title>. <source>Neurology</source> <volume>92</volume> (<issue>16</issue>), <fpage>e1899</fpage>&#x2013;<lpage>e1911</lpage>. <pub-id pub-id-type="doi">10.1212/WNL.0000000000007313</pub-id> </citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ottman</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Lipton</surname>
<given-names>R. B.</given-names>
</name>
<name>
<surname>Ettinger</surname>
<given-names>A. B.</given-names>
</name>
<name>
<surname>Cramer</surname>
<given-names>J.&#x20;A.</given-names>
</name>
<name>
<surname>Reed</surname>
<given-names>M. L.</given-names>
</name>
<name>
<surname>Morrison</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2011</year>). <article-title>Comorbidities of Epilepsy: Results from the Epilepsy Comorbidities and Health (EPIC) Survey</article-title>. <source>Epilepsia</source> <volume>52</volume> (<issue>2</issue>), <fpage>308</fpage>&#x2013;<lpage>315</lpage>. <pub-id pub-id-type="doi">10.1111/j.1528-1167.2010.02927.x</pub-id> </citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Park</surname>
<given-names>J.&#x20;H.</given-names>
</name>
<name>
<surname>Cho</surname>
<given-names>H. E.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>J.&#x20;H.</given-names>
</name>
<name>
<surname>Wall</surname>
<given-names>M. M.</given-names>
</name>
<name>
<surname>Stern</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Lim</surname>
<given-names>H.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Machine Learning Prediction of Incidence of Alzheimer&#x27;s Disease Using Large-Scale Administrative Health Data</article-title>. <source>Npj&#x20;Digit. Med.</source> <volume>3</volume> (<issue>1</issue>), <fpage>1</fpage>&#x2013;<lpage>7</lpage>. <pub-id pub-id-type="doi">10.1038/s41746-020-0256-0</pub-id> </citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Peissig</surname>
<given-names>P. L.</given-names>
</name>
<name>
<surname>Santos Costa</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Caldwell</surname>
<given-names>M. D.</given-names>
</name>
<name>
<surname>Rottscheit</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Berg</surname>
<given-names>R. L.</given-names>
</name>
<name>
<surname>Mendonca</surname>
<given-names>E. A.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>Relational Machine Learning for Electronic Health Record-Driven Phenotyping</article-title>. <source>J.&#x20;Biomed. Inform.</source> <volume>52</volume>, <fpage>260</fpage>&#x2013;<lpage>270</lpage>. <pub-id pub-id-type="doi">10.1016/j.jbi.2014.07.007</pub-id> </citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Quan</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Sundararajan</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Halfon</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Fong</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Burnand</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Luthi</surname>
<given-names>J.-C.</given-names>
</name>
<etal/>
</person-group> (<year>2005</year>). <article-title>Coding Algorithms for Defining Comorbidities in ICD-9-CM and ICD-10 Administrative Data</article-title>. <source>Med. Care</source> <volume>43</volume> (<issue>11</issue>), <fpage>1130</fpage>&#x2013;<lpage>1139</lpage>. <pub-id pub-id-type="doi">10.1097/01.mlr.0000182534.19832.83</pub-id> </citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rajkomar</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Oren</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Dai</surname>
<given-names>A. M.</given-names>
</name>
<name>
<surname>Hajaj</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Hardt</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Scalable and Accurate Deep Learning with Electronic Health Records</article-title>. <source>Npj&#x20;Digital Med.</source> <volume>1</volume> (<issue>1</issue>), <fpage>1</fpage>&#x2013;<lpage>10</lpage>. <pub-id pub-id-type="doi">10.1038/s41746-018-0029-1</pub-id> </citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rist</surname>
<given-names>P. M.</given-names>
</name>
<name>
<surname>Tzourio</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Kurth</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Associations between Lipid Levels and Migraine: Cross-Sectional Analysis in the Epidemiology of Vascular Ageing Study</article-title>. <source>Cephalalgia</source> <volume>31</volume> (<issue>14</issue>), <fpage>1459</fpage>&#x2013;<lpage>1465</lpage>. <pub-id pub-id-type="doi">10.1177/0333102411421682</pub-id> </citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rogers</surname>
<given-names>F. B.</given-names>
</name>
</person-group> (<year>1963</year>). <article-title>Medical Subject Headings</article-title>, <source>Bull. Med. Libr. Assoc.</source>, <volume>51</volume>, <fpage>114</fpage>&#x2013;<lpage>116</lpage>. </citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Romano</surname>
<given-names>P. S.</given-names>
</name>
<name>
<surname>Roos</surname>
<given-names>L. L.</given-names>
</name>
<name>
<surname>Jollis</surname>
<given-names>J.&#x20;G.</given-names>
</name>
</person-group> (<year>1993</year>). <article-title>Presentation Adapting a Clinical Comorbidity Index for Use with ICD-9-CM Administrative Data: Differing Perspectives</article-title>. <source>J.&#x20;Clin. Epidemiol.</source> <volume>46</volume> (<issue>10</issue>), <fpage>1075</fpage>&#x2013;<lpage>1079</lpage>. <pub-id pub-id-type="doi">10.1016/0895-4356(93)90103-8</pub-id> </citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sachdev</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Marmura</surname>
<given-names>M. J.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Metabolic Syndrome and Migraine</article-title>. <source>Front. Neur.</source> <volume>3</volume>. <pub-id pub-id-type="doi">10.3389/fneur.2012.00161</pub-id> </citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Schneeweiss</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>P. S.</given-names>
</name>
<name>
<surname>Avorn</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Glynn</surname>
<given-names>R. J.</given-names>
</name>
</person-group> (<year>2003</year>). <article-title>Improved Comorbidity Adjustment for Predicting Mortality in Medicare Populations</article-title>. <source>Health Serv. Res.</source> <volume>38</volume> (<issue>4</issue>), <fpage>1103</fpage>&#x2013;<lpage>1120</lpage>. <pub-id pub-id-type="doi">10.1111/1475-6773.00165</pub-id> </citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Seidenberg</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Pulsipher</surname>
<given-names>D. T.</given-names>
</name>
<name>
<surname>Hermann</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Association of Epilepsy and Comorbid Conditions</article-title>. <source>Future Neurol.</source> <volume>4</volume> (<issue>5</issue>), <fpage>663</fpage>&#x2013;<lpage>668</lpage>. <pub-id pub-id-type="doi">10.2217/fnl.09.32</pub-id> </citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sessler</surname>
<given-names>D. I.</given-names>
</name>
<name>
<surname>Sigl</surname>
<given-names>J.&#x20;C.</given-names>
</name>
<name>
<surname>Manberg</surname>
<given-names>P. J.</given-names>
</name>
<name>
<surname>Kelley</surname>
<given-names>S. D.</given-names>
</name>
<name>
<surname>Schubert</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Chamoun</surname>
<given-names>N. G.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Broadly Applicable Risk Stratification System for Predicting Duration of Hospitalization and Mortality</article-title>. <source>The J.&#x20;Am. Soc. Anesthesiologists</source> <volume>113</volume> (<issue>5</issue>), <fpage>1026</fpage>&#x2013;<lpage>1037</lpage>. <pub-id pub-id-type="doi">10.1097/ALN.0b013e3181f79a8d</pub-id> </citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sigakis</surname>
<given-names>M. J.&#x20;G.</given-names>
</name>
<name>
<surname>Bittner</surname>
<given-names>E. A.</given-names>
</name>
<name>
<surname>Wanderer</surname>
<given-names>J.&#x20;P.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Validation of a Risk Stratification Index and Risk Quantification Index for Predicting Patient Outcomes</article-title>. <source>Anesthesiology</source> <volume>119</volume> (<issue>3</issue>), <fpage>525</fpage>&#x2013;<lpage>540</lpage>. <pub-id pub-id-type="doi">10.1097/ALN.0b013e31829ce6e6</pub-id> </citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Silberstein</surname>
<given-names>S. D.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Topiramate in Migraine Prevention: A 2016 Perspective</article-title>. <source>Headache</source>, <volume>57</volume> (<issue>1</issue>), <fpage>165</fpage>&#x2013;<lpage>178</lpage>. <pub-id pub-id-type="doi">10.1111/head.12997</pub-id> </citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Spritzer</surname>
<given-names>S. D.</given-names>
</name>
<name>
<surname>Bravo</surname>
<given-names>T. P.</given-names>
</name>
<name>
<surname>Drazkowski</surname>
<given-names>J.&#x20;F.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Topiramate for Treatment in Patients with Migraine and Epilepsy</article-title>. <source>Headache</source> <volume>56</volume> (<issue>6</issue>), <fpage>1081</fpage>&#x2013;<lpage>1085</lpage>. <pub-id pub-id-type="doi">10.1111/head.12826</pub-id> </citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Thesmar</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Sraer</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Pinheiro</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Dadson</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Veliche</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Greenberg</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Combining the Power of Artificial Intelligence with the Richness of Healthcare Claims Data: Opportunities and Challenges</article-title>. <source>PharmacoEconomics</source> <volume>37</volume> (<issue>6</issue>), <fpage>745</fpage>&#x2013;<lpage>752</lpage>. <pub-id pub-id-type="doi">10.1007/s40273-019-00777-6</pub-id> </citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tibshirani</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>1996</year>). <article-title>Regression Shrinkage and Selection via the Lasso</article-title>. <source>J.&#x20;R. Stat. Soc. Ser. B (Methodological)</source> <volume>58</volume> (<issue>1</issue>), <fpage>267</fpage>&#x2013;<lpage>288</lpage>. <pub-id pub-id-type="doi">10.1111/j.2517-6161.1996.tb02080.x</pub-id> </citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Uno</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Cai</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Pencina</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>D&#x27;Agostino</surname>
<given-names>R. B.</given-names>
</name>
<name>
<surname>Wei</surname>
<given-names>L. J.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>On the C-Statistics for Evaluating Overall Adequacy of Risk Prediction Procedures with Censored Survival Data</article-title>. <source>Statist. Med.</source> <volume>30</volume> (<issue>10</issue>), <fpage>1105</fpage>&#x2013;<lpage>1117</lpage>. <pub-id pub-id-type="doi">10.1002/sim.4154</pub-id> </citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Valade</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Les avanc&#xe9;es dans les traitements de crise et de fond de la maladie migraineuse</article-title>. <source>Biologie Aujourd&#x27;hui</source> <volume>213</volume> (<issue>1&#x2013;2</issue>), <fpage>59</fpage>&#x2013;<lpage>64</lpage>. <pub-id pub-id-type="doi">10.1051/jbio/2019021</pub-id> </citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Verrotti</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Mazzocchetti</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Beyond Seizures - the Importance of Comorbidities in Epilepsy</article-title>. <source>Nat. Rev. Neurol.</source> <volume>12</volume> (<issue>10</issue>), <fpage>559</fpage>&#x2013;<lpage>560</lpage>. <pub-id pub-id-type="doi">10.1038/nrneurol.2016.135</pub-id> </citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Victor</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Campbell</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Buse</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Lipton</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Migraine Prevalence by Age and Sex in the United&#x20;States: A Life-Span Study</article-title>. <source>Cephalalgia</source> <volume>30</volume> (<issue>9</issue>), <fpage>1065</fpage>&#x2013;<lpage>1072</lpage>. <pub-id pub-id-type="doi">10.1177/0333102409355601</pub-id> </citation>
</ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Weiss</surname>
<given-names>J.&#x20;C.</given-names>
</name>
<name>
<surname>Natarajan</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Peissig</surname>
<given-names>P. L.</given-names>
</name>
<name>
<surname>McCarty</surname>
<given-names>C. A.</given-names>
</name>
<name>
<surname>Page</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Machine Learning for Personalized Medicine: Predicting Primary Myocardial Infarction from Electronic Health Records</article-title>. <source>AIMag</source> <volume>33</volume> (<issue>4</issue>), <fpage>33</fpage>. <pub-id pub-id-type="doi">10.1609/aimag.v33i4.2438</pub-id> </citation>
</ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wright</surname>
<given-names>M. N.</given-names>
</name>
<name>
<surname>Ziegler</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Ranger: A Fast Implementation of Random Forests for High Dimensional Data in C&#x2b;&#x2b; and R</article-title>. <source>J.&#x20;Stat. Soft.</source> <volume>77</volume> (<issue>1</issue>), <fpage>1</fpage>&#x2013;<lpage>17</lpage>. <pub-id pub-id-type="doi">10.18637/jss.v077.i01</pub-id> </citation>
</ref>
<ref id="B57">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xiao</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Choi</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Opportunities and Challenges in Developing Deep Learning Models Using Electronic Health Records Data: a Systematic Review</article-title>. <source>J.&#x20;Am. Med. Inform. Assoc.</source> <volume>25</volume> (<issue>10</issue>), <fpage>1419</fpage>&#x2013;<lpage>1428</lpage>. <pub-id pub-id-type="doi">10.1093/jamia/ocy068</pub-id> </citation>
</ref>
<ref id="B58">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zaccara</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Neurological Comorbidity and Epilepsy: Implications for Treatment</article-title>. <source>Acta Neurol. Scand.</source> <volume>120</volume> (<issue>1</issue>), <fpage>1</fpage>&#x2013;<lpage>15</lpage>. <pub-id pub-id-type="doi">10.1111/j.1600-0404.2008.01146.x</pub-id> </citation>
</ref>
<ref id="B59">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zou</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Hastie</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Regularization and Variable Selection via the Elastic Net</article-title>. <source>J.&#x20;R. Stat. Soc B.</source> <volume>67</volume> (<issue>2</issue>), <fpage>301</fpage>&#x2013;<lpage>320</lpage>. <pub-id pub-id-type="doi">10.1111/j.1467-9868.2005.00503.x</pub-id> </citation>
</ref>
</ref-list>
</back>
</article>