<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<?covid-19-tdm?>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Artif. Intell.</journal-id>
<journal-title>Frontiers in Artificial Intelligence</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Artif. Intell.</abbrev-journal-title>
<issn pub-type="epub">2624-8212</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">673527</article-id>
<article-id pub-id-type="doi">10.3389/frai.2021.673527</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Artificial Intelligence</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Symptom Prediction and Mortality Risk Calculation for COVID-19 Using Machine Learning</article-title>
<alt-title alt-title-type="left-running-head">Jamshidi et&#x20;al.</alt-title>
<alt-title alt-title-type="right-running-head">AI for COVID-19 Symptom and Mortality Prediction</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Jamshidi</surname>
<given-names>Elham</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="fn" rid="fn1">
<sup>&#x2020;</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1029359/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Asgary</surname>
<given-names>Amirhossein</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="fn" rid="fn1">
<sup>&#x2020;</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Tavakoli</surname>
<given-names>Nader</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="fn" rid="fn1">
<sup>&#x2020;</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Zali</surname>
<given-names>Alireza</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Dastan</surname>
<given-names>Farzaneh</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Daaee</surname>
<given-names>Amir</given-names>
</name>
<xref ref-type="aff" rid="aff5">
<sup>5</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Badakhshan</surname>
<given-names>Mohammadtaghi</given-names>
</name>
<xref ref-type="aff" rid="aff6">
<sup>6</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Esmaily</surname>
<given-names>Hadi</given-names>
</name>
<xref ref-type="aff" rid="aff4">
<sup>4</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1309196/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Jamaldini</surname>
<given-names>Seyed Hamid</given-names>
</name>
<xref ref-type="aff" rid="aff7">
<sup>7</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Safari</surname>
<given-names>Saeid</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1127233/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Bastanhagh</surname>
<given-names>Ehsan</given-names>
</name>
<xref ref-type="aff" rid="aff8">
<sup>8</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Maher</surname>
<given-names>Ali</given-names>
</name>
<xref ref-type="aff" rid="aff9">
<sup>9</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Babajani</surname>
<given-names>Amirhesam</given-names>
</name>
<xref ref-type="aff" rid="aff10">
<sup>10</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/964533/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Mehrazi</surname>
<given-names>Maryam</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Sendani Kashi</surname>
<given-names>Mohammad Ali</given-names>
</name>
<xref ref-type="aff" rid="aff11">
<sup>11</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Jamshidi</surname>
<given-names>Masoud</given-names>
</name>
<xref ref-type="aff" rid="aff12">
<sup>12</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1310277/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Sendani</surname>
<given-names>Mohammad Hassan</given-names>
</name>
<xref ref-type="aff" rid="aff13">
<sup>13</sup>
</xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Rahi</surname>
<given-names>Sahand Jamal</given-names>
</name>
<xref ref-type="aff" rid="aff14">
<sup>14</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Mansouri</surname>
<given-names>Nahal</given-names>
</name>
<xref ref-type="aff" rid="aff15">
<sup>15</sup>
</xref>
<xref ref-type="aff" rid="aff16">
<sup>16</sup>
</xref>
<xref ref-type="aff" rid="aff17">
<sup>17</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/981173/overview"/>
</contrib>
</contrib-group>
<aff id="aff1">
<label>
<sup>1</sup>
</label>Functional Neurosurgery Research Center, Shohada Tajrish Comprehensive Neurosurgical Center of Excellence, Shahid Beheshti University of Medical Sciences, <addr-line>Tehran</addr-line>, <country>Iran</country>
</aff>
<aff id="aff2">
<label>
<sup>2</sup>
</label>Department of Biotechnology, College of Sciences, University of Tehran, <addr-line>Tehran</addr-line>, <country>Iran</country>
</aff>
<aff id="aff3">
<label>
<sup>3</sup>
</label>Trauma and Injury Research Center, Iran University of Medical Sciences, <addr-line>Tehran</addr-line>, <country>Iran</country>
</aff>
<aff id="aff4">
<label>
<sup>4</sup>
</label>Department of Clinical Pharmacy, School of Pharmacy, Shahid Beheshti University of Medical Sciences, <addr-line>Tehran</addr-line>, <country>Iran</country>
</aff>
<aff id="aff5">
<label>
<sup>5</sup>
</label>School of Mechanical Engineering, Sharif University of Technology, <addr-line>Tehran</addr-line>, <country>Iran</country>
</aff>
<aff id="aff6">
<label>
<sup>6</sup>
</label>School of Electrical and Computer Engineering, Engineering Faculty, University of Tehran, <addr-line>Tehran</addr-line>, <country>Iran</country>
</aff>
<aff id="aff7">
<label>
<sup>7</sup>
</label>Department of Genetic, Faculty of Advanced Science and Technology, Tehran Medical Sciences, Islamic Azad University, <addr-line>Tehran</addr-line>, <country>Iran</country>
</aff>
<aff id="aff8">
<label>
<sup>8</sup>
</label>Department of Anesthesiology, Tehran University of Medical Sciences, <addr-line>Tehran</addr-line>, <country>Iran</country>
</aff>
<aff id="aff9">
<label>
<sup>9</sup>
</label>School of Management and Medical Education, Shahid Beheshti University of Medical Sciences, <addr-line>Tehran</addr-line>, <country>Iran</country>
</aff>
<aff id="aff10">
<label>
<sup>10</sup>
</label>Department of Pharmacology, School of Medicine, Shahid Beheshti University of Medical Sciences, <addr-line>Tehran</addr-line>, <country>Iran</country>
</aff>
<aff id="aff11">
<label>
<sup>11</sup>
</label>Department of Business Management, Faculty of Management, University of Tehran, <addr-line>Tehran</addr-line>, <country>Iran</country>
</aff>
<aff id="aff12">
<label>
<sup>12</sup>
</label>Department of Exercise Physiology, Tehran University, <addr-line>Tehran</addr-line>, <country>Iran</country>
</aff>
<aff id="aff13">
<label>
<sup>13</sup>
</label>Department of Computer Engineering, Sharif University of Technology, <addr-line>Tehran</addr-line>, <country>Iran</country>
</aff>
<aff id="aff14">
<label>
<sup>14</sup>
</label>Laboratory of the Physics of Biological Systems, Institute of Physics, &#xc9;cole Polytechnique F&#xe9;d&#xe9;rale de Lausanne (EPFL), <addr-line>Lausanne</addr-line>, <country>Switzerland</country>
</aff>
<aff id="aff15">
<label>
<sup>15</sup>
</label>Division of Pulmonary Medicine, Department of Medicine, Lausanne University Hospital (CHUV), University of Lausanne (UNIL), <addr-line>Lausanne</addr-line>, <country>Switzerland</country>
</aff>
<aff id="aff16">
<label>
<sup>16</sup>
</label>Swiss Institute for Experimental Cancer Research (ISREC), School of Life Sciences, &#xc9;cole Polytechnique F&#xe9;d&#xe9;rale de Lausanne (EPFL), <addr-line>Lausanne</addr-line>, <country>Switzerland</country>
</aff>
<aff id="aff17">
<label>
<sup>17</sup>
</label>Research Group on Artificial Intelligence in Pulmonary Medicine, Division of Pulmonary Medicine, Lausanne University Hospital (CHUV), <addr-line>Lausanne</addr-line>, <country>Switzerland</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/928677/overview">Hong Qin</ext-link>, University of Tennessee at Chattanooga, United&#x20;States</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1249595/overview">Ziwei Ma</ext-link>, University of Tennessee at Chattanooga, United&#x20;States</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1295452/overview">Feng Liu</ext-link>, Stevens Institute of Technology, United&#x20;States</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Nahal Mansouri, <email>nahal.mansouri@chuv.ch</email>; Sahand Jamal Rahi, <email>sahand.rahi@epfl.ch</email>
</corresp>
<fn fn-type="equal" id="fn1">
<label>
<sup>&#x2020;</sup>
</label>
<p>These authors have contributed equally to this&#x20;work</p>
</fn>
<fn fn-type="other">
<p>This article was submitted to Medicine and Public Health, a section of the journal Frontiers in Artificial Intelligence</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>22</day>
<month>06</month>
<year>2021</year>
</pub-date>
<pub-date pub-type="collection">
<year>2021</year>
</pub-date>
<volume>4</volume>
<elocation-id>673527</elocation-id>
<history>
<date date-type="received">
<day>27</day>
<month>02</month>
<year>2021</year>
</date>
<date date-type="accepted">
<day>14</day>
<month>05</month>
<year>2021</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2021 Jamshidi, Asgary, Tavakoli, Zali, Dastan, Daaee, Badakhshan, Esmaily, Jamaldini, Safari, Bastanhagh, Maher, Babajani, Mehrazi, Sendani Kashi, Jamshidi, Sendani, Rahi and Mansouri.</copyright-statement>
<copyright-year>2021</copyright-year>
<copyright-holder>Jamshidi, Asgary, Tavakoli, Zali, Dastan, Daaee, Badakhshan, Esmaily, Jamaldini, Safari, Bastanhagh, Maher, Babajani, Mehrazi, Sendani Kashi, Jamshidi, Sendani, Rahi and Mansouri</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these&#x20;terms.</p>
</license>
</permissions>
<abstract>
<p>
<bold>Background:</bold> Early prediction of symptoms and mortality risks for COVID-19 patients would improve healthcare outcomes, allow for the appropriate distribution of healthcare resources, reduce healthcare costs, aid in vaccine prioritization and self-isolation strategies, and thus reduce the prevalence of the disease. Such publicly accessible prediction models are lacking, however.</p>
<p>
<bold>Methods:</bold> Based on a comprehensive evaluation of existing machine learning (ML) methods, we created two models based solely on the age, gender, and medical histories of 23,749&#x20;hospital-confirmed COVID-19 patients from February to September 2020: a symptom prediction model (SPM) and a mortality prediction model (MPM). The SPM predicts 12 symptom groups for each patient: respiratory distress, consciousness disorders, chest pain, paresis or paralysis, cough, fever or chill, gastrointestinal symptoms, sore throat, headache, vertigo, loss of smell or taste, and muscular pain or fatigue. The MPM predicts the death of COVID-19-positive individuals.</p>
<p>
<bold>Results:</bold> The SPM yielded ROC-AUCs of 0.53&#x2013;0.78 for symptoms. The most accurate prediction was for consciousness disorders at a sensitivity of 74% and a specificity of 70%. 2,440 deaths were observed in the study population. MPM had a ROC-AUC of 0.79 and could predict mortality with a sensitivity of 75% and a specificity of 70%. About 90% of deaths occurred in the top 21 percentile of risk groups. To allow patients and clinicians to use these models easily, we created a freely accessible online interface at <ext-link ext-link-type="uri" xlink:href="http://www.aicovid.org/">www.aicovid.net</ext-link>.</p>
<p>
<bold>Conclusion:</bold> The ML models predict COVID-19-related symptoms and mortality using information that is readily available to patients as well as clinicians. Thus, both can rapidly estimate the severity of the disease, allowing shared and better healthcare decisions with regard to hospitalization, self-isolation strategy, and COVID-19 vaccine prioritization in the coming months.</p>
</abstract>
<kwd-group>
<kwd>COVID-19</kwd>
<kwd>artificial intelligence</kwd>
<kwd>machine learning</kwd>
<kwd>symptom</kwd>
<kwd>mortality</kwd>
</kwd-group>
<contract-sponsor id="cn001">&#xc9;cole Polytechnique F&#xe9;d&#xe9;rale de Lausanne<named-content content-type="fundref-id">10.13039/501100001703</named-content>
</contract-sponsor>
</article-meta>
</front>
<body>
<sec id="s1">
<title>Introduction</title>
<p>The COVID-19 pandemic of the 2019 novel coronavirus (SARS-CoV-2) started in December 2019 and is spreading rapidly, with approximately 62.5&#xa0;million confirmed cases and 1.5&#xa0;million deaths by the end of November 2020 (<xref ref-type="bibr" rid="B27">WHO, 2020</xref>).</p>
<p>The severity of the disease varies widely between different patients, ranging from no symptoms to a mild flu-like illness, to severe respiratory symptoms, and to multi-organ failure leading to death. Among the symptoms, fever, cough, and respiratory distress are more prevalent than symptoms such as consciousness disorders and loss of smell and taste (<xref ref-type="bibr" rid="B23">Tabata et&#x20;al., 2020</xref>; <xref ref-type="bibr" rid="B15">Jamshidi et&#x20;al., 2021b</xref>). In general, complications are common among elderly patients and those with pre-existing conditions. The intensive care unit (ICU) admission rate is substantially higher for these groups (<xref ref-type="bibr" rid="B1">Abate et&#x20;al., 2020</xref>; <xref ref-type="bibr" rid="B14">Jamshidi et&#x20;al., 2021a</xref>).</p>
<p>The Center for Disease Control (CDC) and the World Health Organization (WHO) consider the identification of individuals at higher risk a top priority. This identification could be used for numerous solutions to moderate the consequences of the pandemic for the most vulnerable (<xref ref-type="bibr" rid="B24">CDC COVID-19 Response Team, 2020</xref>) as well as minimize the presence of actively ill patients in society.</p>
<p>This requires the prediction of the symptoms and mortality risk for infected individuals. While symptom prediction models exist for cancer, no such models have been designed for COVID-19 (<xref ref-type="bibr" rid="B17">Levitsky et&#x20;al., 2019</xref>; <xref ref-type="bibr" rid="B11">Goecks et&#x20;al., 2020</xref>). To make rapid, evidence-based decisions possible, they will ideally be based on readily available patient information, i.e.,&#x20;demographic attributes and past medical history (PMH) as opposed to costly laboratory tests. Early decision-making is critical for timely triage and clinical management of patients. For instance, clinical and laboratory data can only be assessed after presenting the individual to a health care center, increasing the risk of unnecessary exposures to the virus and increasing costs (<xref ref-type="bibr" rid="B22">Sun et&#x20;al., 2020</xref>). These parameters are not available immediately and are partly subject to human error. Also, factors like genetic predisposition may increase the models&#x2019; accuracy but are not broadly available.</p>
<p>With the growth of big data in healthcare and the introduction of electronic health records, artificial intelligence (AI) algorithms can be integrated into hospital IT systems and have shown promise as computer-aided diagnosis and prognostic tools. In the era of COVID-19, AI has played an essential role in the early diagnosis of infection, the prognosis of hospitalized patients, contact tracing for spread control, and drug discovery (<xref ref-type="bibr" rid="B16">Lalmuanawma et&#x20;al., 2020</xref>). AI methods can have a higher accuracy over classical statistical analyses.</p>
<p>In contrast to the few previously available COVID-19 risk scales, our mortality prediction model uses a selection of variables that are in principle accessible to all patients and thus can be used immediately after diagnosis (<xref ref-type="bibr" rid="B3">Assaf et&#x20;al., 2020</xref>; <xref ref-type="bibr" rid="B19">Pan et&#x20;al., 2020</xref>). This model not only has a significant benefit in early decision making in the hospital setting, but because it does not require clinicians or laboratories, it can serve as a triage tool for patients in an outpatient setting, in telemedicine, or as a self-assessment tool. For example, decisions on outpatient vs. inpatient care can be made remotely by estimating the most probable symptoms and severity risks. This lessens the strain on health care resources, unnecessary costs, and unwanted exposures to infected patients.</p>
<p>Here, we implemented 2&#xa0;ML methods to predict the symptoms and the mortality of patients with COVID-19. Overall, 23,749 patients were included in the study. The predictors used for the models were age, sex, and PMH of the patients. Both of these models achieved predictions with high accuracy. To our knowledge, this is one of the largest datasets of COVID-19 cases and is the only study that uses patient-available data for the prediction of COVID-19 symptoms and mortality. Furthermore, this study is the most extensive study for mortality prediction for COVID-19 using ML-based on any set of predictors (<xref ref-type="bibr" rid="B2">An et&#x20;al., 2020</xref>; <xref ref-type="bibr" rid="B9">Gao et&#x20;al., 2020</xref>; <xref ref-type="bibr" rid="B25">Vaid et&#x20;al., 2020</xref>; <xref ref-type="bibr" rid="B29">Yadaw et&#x20;al., 2020</xref>).</p>
<p>We also created an online calculator where each individual can predict their COVID-19 related symptoms and risk (<ext-link ext-link-type="uri" xlink:href="http://www.aicovid.org/">www.aicovid.net</ext-link>).</p>
<p>For a standardized representation of the methodology and results of this analysis an adapted version of the Transparent Reporting of Multivariable Prediction Model for Individual Prognosis or Diagnosis (TRIPOD) guideline was followed (<xref ref-type="bibr" rid="B6">Collins et&#x20;al., 2015</xref>).</p>
</sec>
<sec sec-type="methods" id="s2">
<title>Methods</title>
<sec id="s2-1">
<title>Source of Data and Participants</title>
<p>In this cohort study, we used the Hospital Information System (HIS) of 74 secondary and tertiary care hospitals across Tehran, Iran. The eligibility criteria were defined as confirmed or suspected SARS-CoV-2 infections of people aged 18&#x2013;100&#xa0;years registered in the referred HIS. The final database used to design the models was obtained by aggregating the 74 hospitals&#x2019; HIS. The study included patients referred to any of the hospitals between February 1, 2020, and September 30, 2020. Patients were followed up through October 2020 until all the registered patients had the specific death or survival outcome needed for the mortality prediction model (MPM). This study was approved by the Iran University of Medical Sciences Ethics Committee.</p>
</sec>
<sec id="s2-2">
<title>Outcome</title>
<sec id="s2-2-1">
<title>Symptom Prediction Model</title>
<p>The patients&#x2019; symptoms at the time of admission, as recorded in the HIS, were considered as the outputs of the Symptom Prediction Model (SPM). All stated symptoms were clustered in 12 categories to be predicted by the model. The groups are cough, loss of smell or taste, respiratory distress, vertigo, muscular pain or fatigue, sore throat, fever or chill, paresis or paralysis, gastrointestinal problems, headache, chest pain, and consciousness disorders.</p>
</sec>
</sec>
<sec id="s2-3">
<title>Mortality Prediction Model</title>
<p>Death or survival as per the HIS records was defined as the output of the mortality prediction model (MPM).</p>
</sec>
<sec id="s2-4">
<title>Predictors</title>
<p>The patients&#x2019; age, sex, and past medical history (PMH), as detailed in <xref ref-type="table" rid="T1">Table&#x20;1</xref>, were used as predictors for both models. The selection of variables as predictors was based on the available recorded data. All these predictors were recorded in the HIS at the time of admission.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>List of predictors<bold>.</bold> Predictor variables for mortality risk and symptom prediction of COVID-19.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Category</th>
<th align="center">Variable</th>
<th align="center">Description</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td rowspan="2" align="left">Demographic</td>
<td align="left">Age</td>
<td align="left">In years</td>
</tr>
<tr>
<td align="left">Sex</td>
<td align="left">Male or female</td>
</tr>
<tr>
<td rowspan="13" align="left">Past/Current Medical Conditions</td>
<td align="left">
<italic>Cancer</italic>
</td>
<td align="left">Current chemotherapy, radiotherapy, immunotherapy, bone marrow or stem cell transplantation</td>
</tr>
<tr>
<td align="left">Liver disorders</td>
<td align="left">Chronic hepatitis (type B or C), alcohol-related liver disease, primary biliary cirrhosis, primary sclerosing cholangitis, hemochromatosis, cirrhosis</td>
</tr>
<tr>
<td align="left">Blood disorders</td>
<td align="left">Anemia (iron deficiency, thalassemia minor and major, sickle cell disease), coagulopathies (hemophilia and platelet disorders)</td>
</tr>
<tr>
<td align="left">Immune disorders</td>
<td align="left">Immune deficiency (acquired immunodeficiency syndrome, treatment with steroids and immune suppressors), autoimmune disease (rheumatoid arthritis, systemic lupus erythematosus, ankylosing spondylitis, vasculitis).</td>
</tr>
<tr>
<td align="left">Cardiovascular disease</td>
<td align="left">Congestive heart failure, cardiovascular events (myocardial infarction, stroke, angina), valvular heart disease, arrhythmia (e.g. atrial fibrillation)</td>
</tr>
<tr>
<td align="left">Kidney disorders</td>
<td align="left">Chronic kidney disease (stage 3, 4, and end-stage renal disease)</td>
</tr>
<tr>
<td align="left">Respiratory disorders</td>
<td align="left">Asthma, chronic obstructive pulmonary disease (emphysema and chronic bronchitis), extrinsic allergic alveolitis, cystic fibrosis, interstitial lung disease, sarcoidosis, bronchiectasis, pulmonary hypertension</td>
</tr>
<tr>
<td align="left">Neurological disorders</td>
<td align="left">Epilepsy, Parkinson&#x2019;s disease, motor neuron disease, cerebral palsy, dementia, multiple sclerosis</td>
</tr>
<tr>
<td align="left">Endocrine disorders</td>
<td align="left">Hyperthyroidism, hypothyroidism, cushing syndrome, pheochromocytoma, thyroiditis, hyperaldosteronism</td>
</tr>
<tr>
<td align="left">Diabetes mellitus</td>
<td align="left">Type 1 and type 2 diabetes, maturity onset diabetes of the young, insipidus, gestational diabetes</td>
</tr>
<tr>
<td align="left">Hypertension</td>
<td align="left">Primary and secondary</td>
</tr>
<tr>
<td align="left">Psychiatric disorders (removed due to low prevalence)</td>
<td align="left">Bipolar disorder, psychosis, schizophrenia, major depression disorder</td>
</tr>
<tr>
<td align="left">Thrombosis (removed due to low prevalence)</td>
<td align="left">Venous thromboembolism, pulmonary thromboembolism</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s2-5">
<title>Missing Data</title>
<p>We only included patients with the required data. Due to the absence of missing data, there was no imputation of missing values.</p>
</sec>
<sec id="s2-6">
<title>Pre-Processing</title>
<p>Symptoms and predictor variables from the medical histories with an incidence of less than 0.2% were removed to reduce noise. This removed past COVID-19 infections, thrombosis, psychiatric disorders, and organ or bone marrow transplantation from the set of predictor variables. The removed symptoms were tachycardia, seizure, nasal congestion, and skin problems.</p>
<p>Sex, PMH, and symptoms were encoded as binary variables. In training and test sets, the only continuous predictor, age, was standardized to zero mean and unit standard deviation.</p>
</sec>
<sec id="s2-7">
<title>Machine Learning Methods</title>
<p>To ensure generalizability, a 5-fold cross-validation algorithm was employed [Performance evaluation of classification algorithms by k-fold and leave-one-out cross validation, (<xref ref-type="bibr" rid="B28">Wong, 2015</xref>). All records were randomly separated into five independent subsets. Four subsets were used as training data, and one subset was retained as a validation set for model testing. The cross-validation process was then iterated four more times, with each of the five subsets being used as validation data exactly once. Subsequently, model performance metrics were evaluated for training and validation groups separately in each model iteration.</p>
<p>By separating deceased and surviving patients separately into five mortality-stratified subsets first and then combining these into the final five subsets, we maintained the same proportion of deceased and surviving patients in each of the final five subsets.</p>
<p>We evaluated several machine learning techniques for both models: Logistic Regression, Random Forest, Artificial Neural Network (ANN), K-Nearest Neighbors (KNN), Linear Discriminant Analysis (LDA), and Naive Bayes.</p>
<p>We took advantage of the Scikit-learn machine learning library to implement both preprocessing algorithms and models (<xref ref-type="bibr" rid="B10">Garreta and Moncecchi, 2013</xref>).</p>
</sec>
<sec id="s2-8">
<title>Symptom Prediction Model</title>
<p>The SPM output predicts symptoms for SARS-CoV-2 positive patients. Since there are 12 symptom groups, we judged the models&#x2019; overall performance by a single metric, the prevalence-weighted mean of the twelve ROC-AUCs (<xref ref-type="bibr" rid="B18">Mandrekar, 2010</xref>), in which the ROC-AUCs were weighted by symptom prevalence.</p>
</sec>
<sec id="s2-9">
<title>Mortality Prediction Model</title>
<p>The MPM calculates the probability of death for SARS-CoV-2 positive patients. Each model&#x2019;s performance was measured in terms of a ROC-AUC.</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>Results</title>
<sec id="s3-1">
<title>Participants</title>
<p>Baseline characteristics of patients and their symptoms are shown in <xref ref-type="table" rid="T2">Table&#x20;2</xref>. Of all 23,749 confirmed or suspected COVID-19 patients, 2,440 (10.27%) passed away at the end of the study (see <italic>Discussion</italic>). A comparison of the characteristics of survived and deceased patients is shown in <xref ref-type="table" rid="T3">Table&#x20;3</xref>. A comparison of the characteristics of patients with and without each symptom is shown in <xref ref-type="sec" rid="s10">Supplementary Tables S1&#x2013;S16</xref>.</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Patient characteristics and symptoms. Baseline characteristics, symptoms, and death outcomes for COVID-19 patients.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th colspan="2" align="left">Continuous variables</th>
</tr>
<tr>
<th align="left">Variable</th>
<th align="center">Median (&#xb1;IQR)</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Age</td>
<td align="center">52 (&#xb1;29)</td>
</tr>
<tr>
<td colspan="2" align="left">Categorical/Binary variables</td>
</tr>
<tr>
<td align="left">Variable</td>
<td align="center">Count (percent)</td>
</tr>
<tr>
<td colspan="2" align="left">Sex</td>
</tr>
<tr>
<td align="left">Male</td>
<td align="center">12,597 (53.04%)</td>
</tr>
<tr>
<td align="left">Female</td>
<td align="center">11,152 (46.96%)</td>
</tr>
<tr>
<td align="left">Cardiovascular disease</td>
<td align="center">2,471 (10.4%)</td>
</tr>
<tr>
<td align="left">Diabetes</td>
<td align="center">2,068 (8.71%)</td>
</tr>
<tr>
<td align="left">Hypertension</td>
<td align="center">2,004 (8.44%)</td>
</tr>
<tr>
<td align="left">Respiratory diseases</td>
<td align="center">546 (2.3%)</td>
</tr>
<tr>
<td align="left">Cancer</td>
<td align="center">477 (2.01%)</td>
</tr>
<tr>
<td align="left">Kidney disorders</td>
<td align="center">416 (1.75%)</td>
</tr>
<tr>
<td align="left">Neurological disorders</td>
<td align="center">264 (1.11%)</td>
</tr>
<tr>
<td align="left">Immune disorders</td>
<td align="center">178 (0.75%)</td>
</tr>
<tr>
<td align="left">Blood disorders</td>
<td align="center">152 (0.64%)</td>
</tr>
<tr>
<td align="left">Current pregnancy</td>
<td align="center">139 (0.59%)</td>
</tr>
<tr>
<td align="left">Liver disorders</td>
<td align="center">119 (0.5%)</td>
</tr>
<tr>
<td align="left">Endocrine disorders</td>
<td align="center">97 (0.41%)</td>
</tr>
<tr>
<td align="left">Organ or bone marrow transplant</td>
<td align="center">29 (0.12%)</td>
</tr>
<tr>
<td align="left">Mental illnesses</td>
<td align="center">19 (0.08%)</td>
</tr>
<tr>
<td align="left">Thrombosis</td>
<td align="center">15 (0.06%)</td>
</tr>
<tr>
<td align="left">Past COVID-19 infection</td>
<td align="center">10 (0.04%)</td>
</tr>
<tr>
<td colspan="2" align="left">Outcomes</td>
</tr>
<tr>
<td align="left">Survived</td>
<td align="center">21,309 (89.73%)</td>
</tr>
<tr>
<td align="left">Dead</td>
<td align="center">2,440 (10.27%)</td>
</tr>
<tr>
<td colspan="2" align="left">Symptoms</td>
</tr>
<tr>
<td align="left">Cough</td>
<td align="center">11,995 (50.51%)</td>
</tr>
<tr>
<td align="left">Respiratory distress</td>
<td align="center">10,342 (43.55%)</td>
</tr>
<tr>
<td align="left">Muscular pain or fatigue</td>
<td align="center">9,249 (38.94%)</td>
</tr>
<tr>
<td align="left">Fever or chill</td>
<td align="center">8,553 (36.01%)</td>
</tr>
<tr>
<td align="left">Gastrointestinal problems</td>
<td align="center">2,469 (10.4%)</td>
</tr>
<tr>
<td align="left">Headache</td>
<td align="center">1,120 (4.72%)</td>
</tr>
<tr>
<td align="left">Chest pain</td>
<td align="center">745 (3.14%)</td>
</tr>
<tr>
<td align="left">Consciousness disorders</td>
<td align="center">698 (2.94%)</td>
</tr>
<tr>
<td align="left">Loss of smell or taste</td>
<td align="center">659 (2.77%)</td>
</tr>
<tr>
<td align="left">Vertigo</td>
<td align="center">501 (2.11%)</td>
</tr>
<tr>
<td align="left">Sore throat</td>
<td align="center">157 (0.66%)</td>
</tr>
<tr>
<td align="left">Paresis or paralysis</td>
<td align="center">121 (0.51%)</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap id="T3" position="float">
<label>TABLE 3</label>
<caption>
<p>Comparison between survived and deceased patient groups. Comparative evaluation of the characteristics of survived and deceased COVID-19 patients.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th colspan="5" align="left">Continuous variables</th>
</tr>
<tr>
<th align="left">Variable</th>
<th align="center">Median in survivors (&#xb1;IQR)</th>
<th align="center">Median in deceased (&#xb1;IQR)</th>
<th align="center">F-test statistics</th>
<th align="center">F-test <italic>p</italic>-value</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Age</td>
<td align="center">49 (&#xb1;27)</td>
<td align="center">70 (&#xb1;21)</td>
<td align="center">2,039.47</td>
<td align="center">&#x3c;0.001</td>
</tr>
<tr>
<td colspan="5" align="left">Categorical/Binary variables</td>
</tr>
<tr>
<td align="left">Variable</td>
<td align="center">Count in survivors (percent in survivors)</td>
<td align="center">Count in deceased (percent in deceased)</td>
<td align="center">Chi2 statistics</td>
<td align="left">Chi2&#x20;<italic>p</italic>-value</td>
</tr>
<tr>
<td align="left">Sex</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left">Male</td>
<td align="center">11,163 (52.39%)</td>
<td align="center">1,434 (58.77%)</td>
<td align="center">16.82</td>
<td align="center">&#x3c;0.001</td>
</tr>
<tr>
<td align="left">Female</td>
<td align="center">10,146 (47.61%)</td>
<td align="center">1,006 (41.23%)</td>
<td align="center">19</td>
<td align="center">&#x3c;0.001</td>
</tr>
<tr>
<td align="left">Cardiovascular disease</td>
<td align="center">2,039 (9.57%)</td>
<td align="center">432 (17.7%)</td>
<td align="center">139.29</td>
<td align="center">&#x3c;0.001</td>
</tr>
<tr>
<td align="left">Diabetes</td>
<td align="center">1,693 (7.94%)</td>
<td align="center">375 (15.37%)</td>
<td align="center">138.57</td>
<td align="center">&#x3c;0.001</td>
</tr>
<tr>
<td align="left">Hypertension</td>
<td align="center">1,676 (7.87%)</td>
<td align="center">328 (13.44%)</td>
<td align="center">80.71</td>
<td align="center">&#x3c;0.001</td>
</tr>
<tr>
<td align="left">Respiratory disorder<bold>s</bold>
</td>
<td align="center">462 (2.17%)</td>
<td align="center">84 (3.44%)</td>
<td align="center">15.47</td>
<td align="center">&#x3c;0.001</td>
</tr>
<tr>
<td align="left">Cancer</td>
<td align="center">343 (1.61%)</td>
<td align="center">134 (5.49%)</td>
<td align="center">164.28</td>
<td align="center">&#x3c;0.001</td>
</tr>
<tr>
<td align="left">Kidney disorders</td>
<td align="center">317 (1.49%)</td>
<td align="center">99 (4.06%)</td>
<td align="center">82.54</td>
<td align="center">&#x3c;0.001</td>
</tr>
<tr>
<td align="left">Neurological disorders</td>
<td align="center">207 (0.97%)</td>
<td align="center">57 (2.34%)</td>
<td align="center">36.68</td>
<td align="center">&#x3c;0.001</td>
</tr>
<tr>
<td align="left">Immune disorders</td>
<td align="center">152 (0.71%)</td>
<td align="center">26 (1.07%)</td>
<td align="center">3.62</td>
<td align="center">0.057</td>
</tr>
<tr>
<td align="left">Blood disorders</td>
<td align="center">112 (0.53%)</td>
<td align="center">40 (1.64%)</td>
<td align="center">42.43</td>
<td align="center">&#x3c;0.001</td>
</tr>
<tr>
<td align="left">Current pregnancy</td>
<td align="center">133 (0.62%)</td>
<td align="center">6 (0.25%)</td>
<td align="center">5.35</td>
<td align="center">0.021</td>
</tr>
<tr>
<td align="left">Liver disorders</td>
<td align="center">101 (0.47%)</td>
<td align="center">18 (0.74%)</td>
<td align="center">3.04</td>
<td align="center">0.081</td>
</tr>
<tr>
<td align="left">Endocrine disorders</td>
<td align="center">88 (0.41%)</td>
<td align="center">9 (0.37%)</td>
<td align="center">0.1</td>
<td align="center">0.747</td>
</tr>
<tr>
<td align="left">Organ or bone marrow transplant</td>
<td align="center">25 (0.12%)</td>
<td align="center">4 (0.16%)</td>
<td align="center">0.39</td>
<td align="center">0.533</td>
</tr>
<tr>
<td align="left">Psychiatric disorders</td>
<td align="center">16 (0.08%)</td>
<td align="center">3 (0.12%)</td>
<td align="center">0.63</td>
<td align="center">0.428</td>
</tr>
<tr>
<td align="left">Thrombosis</td>
<td align="center">13 (0.06%)</td>
<td align="center">2 (0.08%)</td>
<td align="center">0.15</td>
<td align="center">0.696</td>
</tr>
<tr>
<td align="left">Past COVID-19 infection</td>
<td align="center">10 (0.05%)</td>
<td align="center">0 (0.0%)</td>
<td align="center">1.15</td>
<td align="center">0.285</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>We used statistical hypothesis tests to demonstrate each predictor variable&#x2019;s significance to the model outputs. We employed the F-test (<xref ref-type="bibr" rid="B21">Snedecor, 1957</xref>) technique for age, a continuous variable, and the Chi-square (<xref ref-type="bibr" rid="B21">Snedecor, 1957</xref>) technique for other categorical variables such as sex and&#x20;PMH.</p>
</sec>
<sec id="s3-2">
<title>Model Specification</title>
<p>We evaluated six machine learning methods for both the SPM and MPM, which are listed, together with the hyperparameters used in <xref ref-type="table" rid="T4">Table&#x20;4</xref>.</p>
<table-wrap id="T4" position="float">
<label>TABLE 4</label>
<caption>
<p>Machine learning methods and hyperparameters&#x20;used.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th colspan="3" align="left">The Mortality Prediction Model</th>
</tr>
<tr>
<th align="left">Method</th>
<th align="center">Parameter</th>
<th align="center">Value(s)</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Logistic Regression</td>
<td align="left">C</td>
<td align="center">1.0</td>
</tr>
<tr>
<td rowspan="3" align="left">Random Forest</td>
<td align="left">Number of trees</td>
<td align="center">500</td>
</tr>
<tr>
<td align="left">Min. Number of samples at a leaf node</td>
<td align="center">%0.1 of all samples</td>
</tr>
<tr>
<td align="left">Criterion</td>
<td align="center">Gini</td>
</tr>
<tr>
<td rowspan="3" align="left">Artificial Neural Networks</td>
<td align="left">Number of layers</td>
<td align="center">3</td>
</tr>
<tr>
<td align="left">Output space dimensionality for each layer</td>
<td align="center">32, 16, 1</td>
</tr>
<tr>
<td align="left">Activation function for each layer</td>
<td align="center">Tanh, tanh, sigmoid</td>
</tr>
<tr>
<td rowspan="2" align="left">K-Nearest Neighbors</td>
<td align="left">K</td>
<td align="center">10</td>
</tr>
<tr>
<td align="left">Weight function</td>
<td align="center">Distance</td>
</tr>
<tr>
<td align="left">Linear Discriminant Analysis</td>
<td align="left">Solver</td>
<td align="center">SVD</td>
</tr>
<tr>
<td align="left">Naive Bayes</td>
<td align="left">Interval size of age categories</td>
<td align="center">0.1</td>
</tr>
<tr>
<td colspan="3" align="left">The Symptom Prediction Model</td>
</tr>
<tr>
<td align="left">Method</td>
<td align="left">Parameter</td>
<td align="center">Value</td>
</tr>
<tr>
<td align="left">Logistic Regression</td>
<td align="left">C</td>
<td align="center">1.0</td>
</tr>
<tr>
<td rowspan="3" align="left">Random Forest</td>
<td align="left">Number of trees</td>
<td align="center">200</td>
</tr>
<tr>
<td align="left">Min. Number of samples at a leaf node</td>
<td align="center">%0.1 of all samples</td>
</tr>
<tr>
<td align="left">Criterion</td>
<td align="center">Gini</td>
</tr>
<tr>
<td rowspan="3" align="left">Artificial Neural Network</td>
<td align="left">Number of layers</td>
<td align="center">4</td>
</tr>
<tr>
<td align="left">Output space&#x2019;s dimensionality for each layer</td>
<td align="center">32, 32, 32, 12</td>
</tr>
<tr>
<td align="left">Activation function for each layer</td>
<td align="center">Tanh, tanh, tanh, tanh, sigmoid</td>
</tr>
<tr>
<td rowspan="2" align="left">K-Nearest Neighbors</td>
<td align="left">K</td>
<td align="center">5</td>
</tr>
<tr>
<td align="left">Weight function</td>
<td align="center">Distance</td>
</tr>
<tr>
<td align="left">Linear Discriminant Analysis</td>
<td align="left">Solver</td>
<td align="center">SVD</td>
</tr>
<tr>
<td align="left">Naive Bayes</td>
<td align="left">Interval size of age categories</td>
<td align="center">0.1</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3-3">
<title>Model Performance</title>
<sec id="s3-3-1">
<title>Symptom Prediction Model</title>
<p>The SPM can be considered as 12 separated classifiers; each predicts the occurrence of a specific symptom. While the performance of each sub-classifier can be evaluated separately, the overall performance can be assessed using the prevalence-weighted mean of the ROC-AUCs, since the symptoms have different prevalence. The prevalence-weighted mean ROC-AUC for each method is illustrated in <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>. Although the KNN method provided the highest weighted mean ROC-AUC for the test data, it was the least robust method since its performance varied considerably for different validation folds (note standard deviation bars). The Random Forest method achieved better overall performance and robustness. The weighted mean ROC-AUC value of this method was 0.582 for the test&#x20;data.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Prevalence-weighted means ROC-AUCs for different ML models. The models were used to implement the Symptom Prediction Model (SPM). Error bars denote the standard deviation over different cross-validation&#x20;folds.</p>
</caption>
<graphic xlink:href="frai-04-673527-g001.tif"/>
</fig>
<p>Moreover, the performance of the SPM can be evaluated for each symptom separately. The ROC-AUC values for predicting consciousness disorder, paresis or paralysis, and chest pain were 0.785, 0.729, and 0.686, respectively. Also, at a specificity of 70%, the sensitivities were 73%, 50%, and 53%, respectively.</p>
<p>As shown in <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>, the random forest model with a mean ROC-AUC of 0.8 and 0.79 has the highest efficiency in the training and the validation groups, respectively, followed by the Neural Network and LDA. In the symptom prediction model, the ROC-AUC values of all models in addition to the weighted average of ROC-AUC of different ML methods for each symptom are shown in <xref ref-type="sec" rid="s10">Supplementary Figure S1</xref>. <xref ref-type="sec" rid="s10">Supplementary Figure S2</xref> delineates each method&#x27;s performance for all symptoms as a Radar&#x20;chart.</p>
<p>Based on the ROC diagram and the information from the database, the other performance metrics of the other models were identified. In addition to the ROC-AUC of the risk prediction model, we calculated the sensitivity and the negative and positive predictive value (NPV and PPV respectively) for each model. The detailed results of all six algorithms for both MPM and SPM are shown in <xref ref-type="sec" rid="s10">Supplementary Tables S17 and&#x20;S18</xref>.</p>
<p>The calibration plot of the RF implementation for each symptom predictor (sub-classifier) is depicted in <xref ref-type="sec" rid="s10">Supplementary Figure S3</xref> which shows the calibration plot of the RF implementation of each symptom.</p>
</sec>
</sec>
<sec id="s3-4">
<title>Mortality Prediction Model</title>
<p>The ROC-AUC values for each method are depicted in <xref ref-type="fig" rid="F2">Figure&#x20;2</xref>. In the MPM classifier, the Random Forest method outperformed the other methods just as for the SPM. The achieved ROC-AUC value was 0.79 for the test&#x20;data.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>ROC-AUCs of different ML models which were used to implement the MPM. The Random Forest (RF) model outperformed the other approaches.</p>
</caption>
<graphic xlink:href="frai-04-673527-g002.tif"/>
</fig>
<p>
<xref ref-type="sec" rid="s10">Supplementary Figure S4</xref> shows ROC diagrams representing the true-positive rates vs. false-positive rates for each method used to implement the MPM. The calibration plot of the RF model is depicted in <xref ref-type="sec" rid="s10">Supplementary Figure S5</xref>. Calibration indications such as Mean Calibration Error are also shown in the <xref ref-type="sec" rid="s10">Supplementary Figure S5</xref> for different methods.</p>
</sec>
<sec id="s3-5">
<title>Model Input-Output Correlations</title>
<p>We used the Chi-square test and the F-test to evaluate the extent to which PMH, sex, or age predict the outputs of the SPM and MPM. The larger the values of these test values are for each predictor variable, the more the predictor variable is predictive of the output of the models. For categorical predictor variables (i.e.,&#x20;PMH and sex), the Chi-square hypothesis test was used. To evaluate the predictive value of a categorical variable, we examined whether it was more common in patients who died (MPM) or in patients with a particular symptom (SPM). For the only continuous variable (age), we used the F-test. To find the impact of age, we examined if the age median was higher in dead patients (MPM) or patients with a particular symptom (SPM).</p>
<p>For the SPM model, <xref ref-type="sec" rid="s10">Supplementary Figure S6</xref> shows how each factor in the PMH was correlated with each symptom using the Chi-square test. For example, patients with diabetes or cardiovascular disease were more likely to have consciousness disorders and chest pain in case of infection with COVID-19. The effect of age on each symptom is shown in <xref ref-type="sec" rid="s10">Supplementary Figure S7</xref> using the F-test. Older patients were more likely to develop symptoms such as respiratory distress and consciousness disorder but also less likely to develop symptoms such as muscular pain or fatigue.</p>
<p>In addition, for the MPM, the impact of each PMH on death is shown in <xref ref-type="sec" rid="s10">Supplementary Figure S8</xref>. In our analysis, cancer, cardiovascular disease, and diabetes have the greatest effects on the risk of death in patients with Covid 19; on the other hand, pregnancy or being female decreased the chances of death. The F-test statistic of age in the MPM model is 2,039.47, which explains the increase in mortality risk from&#x20;aging.</p>
<p>DeLong&#x27;s test shows the statistically significant difference between AUCs of models. The DeLong tests for the MPM and SPM predictions are shown through <xref ref-type="sec" rid="s10">Supplementary Figures S9&#x2013;S21</xref>.</p>
</sec>
<sec id="s3-6">
<title>Validation of the Model for Each Mortality Peak</title>
<p>For additional validation of our model, we evaluated the performance of the final random forest for MPM during the periods with the highest rate of mortality. The data corresponding to each available mortality peak (april, February, and September 2020) was selected from the validation dataset of each model, and the outcome (recovery or death of the patient) during each period was predicted by the model and shown as a ROC diagram (<xref ref-type="fig" rid="F3">Figure&#x20;3</xref>). Despite the variation of the AUC in the mortality peaks, the weighted average of the AUC values corresponding to each period was approximately equal to the average model yield for the entire data. We can conclude that the model continues to perform equally well during each mortality peak. The cause of the high yield in april could be explained by the large number of available samples which would allow the algorithm to learn more accurately.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>ROC chart for Prediction of RF models in different timelines<bold>.</bold> An indicator of model performance on validation dataset in the peak months of COVID-19 outbreak in Iran.</p>
</caption>
<graphic xlink:href="frai-04-673527-g003.tif"/>
</fig>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<title>Discussion</title>
<p>Our objective in this study was to develop 2&#xa0;ML models to predict the mortality and symptoms of COVID-19-positive patients among the general population using age, gender, and comorbidities alone. These models can guide the design of measures to combat the COVID-19 pandemic. The prediction of vulnerability using the models allows people in different risk groups to take appropriate actions if they contract COVID-19. For example, people who fall into the low-risk group can start isolation sooner when the predicted symptoms appear and refer to a hospital only if the symptoms persist. As a result, the risk of disease spread and the pressure on the health care system from unnecessary hospital visits, costs, and psychological and physical stress to the medical staff could be reduced (<xref ref-type="bibr" rid="B7">Emanuel et&#x20;al., 2020</xref>). In contrast, people who are predicted to be at higher risk are recommended to seek medical care immediately. Predictions can speed up the treatment process and ultimately decrease mortality.</p>
<p>Our study has shown that multiple symptoms have strong correlations with different medical history factors. Symptoms can be either amplified or attenuated by health backgrounds; for instance, hypertension, diabetes, and respiratory and neurological disorders increased the chances of loss of smell or taste; however, pregnancy, cancer, higher age, cardiovascular disease, and liver, immune system, blood, and kidney disorders have attenuated the appearance of this symptom.</p>
<p>Due to the complexity of the COVID-19 pathogenesis, many clinical studies revealed contradictory results, for example, the effectiveness or ineffectiveness of remdisivir (<xref ref-type="bibr" rid="B4">Beigel et&#x20;al., 2020</xref>; <xref ref-type="bibr" rid="B12">Goldman et&#x20;al., 2020</xref>; <xref ref-type="bibr" rid="B26">Wang et&#x20;al., 2020</xref>). We hypothesize that the imbalance of mortality risks between the intervention and control groups could have been a problem in these studies. With the help of our model, such problems could be partially solved by equalizing the mortality baseline in different clinical groups.</p>
<p>Our AI models can also be beneficial for COVID-19 vaccine testing and prioritization strategies. The limited number of approved vaccines in the first months of the vaccination process and the potential shortages make vaccine prioritization inevitable. This prioritization would be more important for developing countries that do not have the resources to pre-order vaccines from multiple companies (<xref ref-type="bibr" rid="B20">Persad et&#x20;al., 2020</xref>). Having a mortality prediction tool for each individual could be a valuable tool for governments to decide on vaccines&#x27; allocation.</p>
<sec id="s4-1">
<title>Limitations</title>
<p>Since our dataset was collected by the HIS, it did not contain COVID-19 patients that did not refer to a hospital or had no major symptoms to be identified as infected. This could explain the high mortality rate in our and other studies (<xref ref-type="bibr" rid="B8">Fumagalli et&#x20;al., 2020</xref>; <xref ref-type="bibr" rid="B13">Gue et&#x20;al., 2020</xref>; <xref ref-type="bibr" rid="B29">Yadaw et&#x20;al., 2020</xref>). However, for a systematic study with few confounding variables, uniform data collection is essential, which can only be realistically ensured with hospital&#x20;data.</p>
<p>Also, other variables such as the viral load may be important but are difficult to measure and are not readily available. We opted for easily accessible predictor variables to allow the widespread use of the models.</p>
<p>One way to improve the models is to subgroup-specific factors in the medical history or specific symptoms further. The main reason for grouping factors and symptoms was the low prevalence of certain subsets in the dataset.</p>
<p>In conclusion, we evaluated 15 parameters (<xref ref-type="table" rid="T1">Table&#x20;1</xref>) for predicting the symptoms and the mortality risk of COVID-19 patients. The ML models trained in this study could help people quickly determine their mortality risk and the probable symptoms of the infection. These tools could aid patients, physicians, and governments with informed and shared decision-making.</p>
</sec>
</sec>
</body>
<back>
<sec id="s5">
<title>Data Availability Statement</title>
<p>The original contributions presented in the study are included in the article/<xref ref-type="sec" rid="s10">Supplementary Material</xref>, further inquiries can be directed to the corresponding authors.</p>
</sec>
<sec id="s6">
<title>Ethics Statement</title>
<p>The studies involving human participants were reviewed and approved by Iran National Committee for Ethics in Biomedical Research. Written informed consent for participation was not required for this study in accordance with the national legislation and the institutional requirements.</p>
</sec>
<sec id="s7">
<title>Author Contributions</title>
<p>EJ: Conceptualization-Equal, Methodology-Equal, Project administration-Equal, Writing-original draft-Equal, Writing-review and editing-Equal; AA: Conceptualization-Equal, Methodology-Equal, Project administration-Equal, Writing-original draft-Equal, Writing-review and editing-Equal; NT: Conceptualization-Equal, Methodology-Equal, Project administration-Equal, Writing-original draft-Equal, Writing-review and editing-Equal; AZ: Data curation-Equal, Investigation administration-Equal, Writing-original draft-Equal, Writing-review and editing-Equal; FD: Data curation-Equal, Investigation-Equal, Writing-original draft-Equal, Writing-review and editing-Equal; AD: Data curation-Equal, Investigation Equal, Writing-original draft-Equal, Writing-review and editing-Equal; MB: Data curation-Equal, Investigation-Equal, Writing-original draft-Equal, Writing-review and editing-Equal; HE: Data curation-Equal, Investigation-Equal, Writing-original draft-Equal, Writing-review and editing-Equal; SJ: Data curation-Equal, Investigation-Equal, Writing-original draft-Equal, Writing-review and editing-Equal; SS: Data curation-Equal, Investigation-Equal, Writing-original draft-Equal, Writing-review and editing-Equal; EB: Data curation-Equal, Investigation-Equal, Writing-original draft-Equal, Writing-review and editing-Equal; AM: Data curation-Equal, Investigation-Equal, Writing-original draft-Equal, Writing-review and editing-Equal; AB: Data curation-Equal, Investigation-Equal, Writing-original draft-Equal, Writing-review and editing-Equal; MM: Data curation-Equal, Investigation-Equal, Writing-original draft-Equal, Writing-review and editing-Equal; MS: Data curation-Equal, Investigation-Equal and Writing-original draft-Equal, Writing-review and editing-Equal; MJ: Data curation-Equal, Investigation-Equal and Writing-original draft-Equal; SJ: Conceptualization-Equal, Methodology-Equal, Project administration-Equal, Supervision-Equal, Writing-original draft-Equal, Writing-review and editing-Equal; NM: Conceptualization-Equal, Methodology-Equal, Project administration-Equal, Supervision-Equal, Writing-original draft-Equal, Writing-review and editing-Equal.</p>
</sec>
<sec id="s8">
<title>Funding</title>
<p>SJ thanks the &#xc9;cole polytechnique f&#xe9;d&#xe9;rale de Lausanne for generous support.</p>
</sec>
<sec sec-type="COI-statement" id="s9">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="s10">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/frai.2021.673527/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/frai.2021.673527/full&#x23;supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="DataSheet1.docx" id="SM1" mimetype="application/docx" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<sec id="s11">
<title>Abbreviations</title>
<p>AI, artificial intelligence; COVID-19, coronavirus disease of 2019; intensive care unit, IQR; interquartile range, KS; Kolmogorov-Smirnov, LR; logistic regression, ML; machine learning, RF; random forest, RDW; red blood cell, distribution width; ROC, receiver operating characteristic; HIS, hospital information system.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Abate</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Ali</surname>
<given-names>S. A.</given-names>
</name>
<name>
<surname>Mantfardo</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Basu</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Rate of Intensive Care Unit Admission and Outcomes Among Patients with Coronavirus: A Systematic Review and Meta-Analysis</article-title>. <source>PLoS One</source>. <volume>15</volume>, <fpage>e0235653</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0235653</pub-id> </citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>An</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Lim</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>D.-W.</given-names>
</name>
<name>
<surname>Chang</surname>
<given-names>J.&#x20;H.</given-names>
</name>
<name>
<surname>Choi</surname>
<given-names>Y. J.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>S. W.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Machine Learning Prediction for Mortality of Patients Diagnosed with COVID-19: a Nationwide Korean Cohort Study</article-title>. <source>Sci. Rep.</source> <volume>10</volume>, <fpage>1</fpage>&#x2013;<lpage>11</lpage>. <pub-id pub-id-type="doi">10.1038/s41598-020-75767-2</pub-id> </citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Assaf</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Gutman</surname>
<given-names>Y. a.</given-names>
</name>
<name>
<surname>Neuman</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Segal</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Amit</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Gefen-Halevi</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Utilization of Machine-Learning Models to Accurately Predict the Risk for Critical COVID-19</article-title>. <source>Intern. Emerg. Med.</source> <volume>15</volume>, <fpage>1435</fpage>&#x2013;<lpage>1443</lpage>. <pub-id pub-id-type="doi">10.1007/s11739-020-02475-0</pub-id> </citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Beigel</surname>
<given-names>J.&#x20;H.</given-names>
</name>
<name>
<surname>Tomashek</surname>
<given-names>K. M.</given-names>
</name>
<name>
<surname>Dodd</surname>
<given-names>L. E.</given-names>
</name>
<name>
<surname>Mehta</surname>
<given-names>A. K.</given-names>
</name>
<name>
<surname>Zingman</surname>
<given-names>B. S.</given-names>
</name>
<name>
<surname>Kalil</surname>
<given-names>A. C.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Remdesivir for the Treatment of Covid-19 - Final Report</article-title>. <source>N. Engl. J.&#x20;Med.</source> <volume>383</volume>, <fpage>1813</fpage>&#x2013;<lpage>1826</lpage>. <pub-id pub-id-type="doi">10.1056/nejmoa2007764</pub-id> </citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<collab>CDC COVID-19 Response Team</collab> (<year>2020</year>). <article-title>Severe Outcomes Among Patients with Coronavirus Disease 2019 (COVID-19) - United&#x20;States, February 12-March 16, 2020</article-title>. <source>MMWR. Morb. Mortal. Wkly. Rep.</source> <volume>69</volume>(<issue>12</issue>), <fpage>343</fpage>&#x2013;<lpage>346</lpage>. <pub-id pub-id-type="doi">10.15585/mmwr.mm6912e2</pub-id> </citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Collins</surname>
<given-names>G. S.</given-names>
</name>
<name>
<surname>Reitsma</surname>
<given-names>J.&#x20;B.</given-names>
</name>
<name>
<surname>Altman</surname>
<given-names>D. G.</given-names>
</name>
<name>
<surname>Moons</surname>
<given-names>K. G.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Transparent Reporting of a Multivariable Prediction Model for Individual Prognosis or Diagnosis (TRIPOD): the TRIPOD Statement</article-title>. <source>Br. J.&#x20;Surg.</source> <volume>102</volume>, <fpage>148</fpage>&#x2013;<lpage>158</lpage>. <pub-id pub-id-type="doi">10.1002/bjs.9736</pub-id> </citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Emanuel</surname>
<given-names>E. J.</given-names>
</name>
<name>
<surname>Persad</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Upshur</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Thome</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Parker</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Glickman</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Fair Allocation of Scarce Medical Resources in the Time of Covid-19</article-title>. <source>N. Engl. J.&#x20;Med.</source> <volume>382</volume>, <fpage>2049</fpage>&#x2013;<lpage>2055</lpage>. <pub-id pub-id-type="doi">10.1056/nejmsb2005114</pub-id> </citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fumagalli</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Rozzini</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Vannini</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Coccia</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Cesaroni</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Mazzeo</surname>
<given-names>F.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Clinical Risk Score to Predict In-Hospital Mortality in COVID-19 Patients: a Retrospective Cohort Study</article-title>. <source>BMJ&#x20;Open</source>. <volume>10</volume>, <fpage>e040729</fpage>. <pub-id pub-id-type="doi">10.1136/bmjopen-2020-040729</pub-id> </citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Cai</surname>
<given-names>G.-Y.</given-names>
</name>
<name>
<surname>Fang</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>H.-Y.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>S.-Y.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>L.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Machine Learning Based Early Warning System Enables Accurate Mortality Risk Prediction for COVID-19</article-title>. <source>Nat. Commun.</source> <volume>11</volume>, <fpage>1</fpage>&#x2013;<lpage>10</lpage>. <pub-id pub-id-type="doi">10.1038/s41467-020-18684-2</pub-id> </citation>
</ref>
<ref id="B10">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Garreta</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Moncecchi</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2013</year>). <source>Learning Scikit-Learn: Machine Learning in Python</source>. <publisher-loc>Birmingham United Kingdom</publisher-loc>: <publisher-name>Packt Publishing Ltd</publisher-name>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Goecks</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Jalili</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Heiser</surname>
<given-names>L. M.</given-names>
</name>
<name>
<surname>Gray</surname>
<given-names>J.&#x20;W.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>How Machine Learning Will Transform Biomedicine</article-title>. <source>Cell</source> <volume>181</volume>, <fpage>92</fpage>&#x2013;<lpage>101</lpage>. <pub-id pub-id-type="doi">10.1016/j.cell.2020.03.022</pub-id> </citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Goldman</surname>
<given-names>J.&#x20;D.</given-names>
</name>
<name>
<surname>Lye</surname>
<given-names>D. C. B.</given-names>
</name>
<name>
<surname>Hui</surname>
<given-names>D. S.</given-names>
</name>
<name>
<surname>Marks</surname>
<given-names>K. M.</given-names>
</name>
<name>
<surname>Bruno</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Montejano</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Remdesivir for 5 or 10&#x20;Days in Patients with Severe Covid-19</article-title>. <source>N. Engl. J.&#x20;Med.</source> <volume>383</volume>, <fpage>1827</fpage>&#x2013;<lpage>1837</lpage>. <pub-id pub-id-type="doi">10.1056/nejmoa2015301</pub-id> </citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gue</surname>
<given-names>Y. X.</given-names>
</name>
<name>
<surname>Tennyson</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Gao</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Ren</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Kanji</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Gorog</surname>
<given-names>D. A.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Development of a Novel Risk Score to Predict Mortality in Patients Admitted to Hospital with COVID-19</article-title>. <source>Sci. Rep.</source> <volume>10</volume>, <fpage>1</fpage>&#x2013;<lpage>8</lpage>. <pub-id pub-id-type="doi">10.1038/s41598-020-78505-w</pub-id> </citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jamshidi</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Asgary</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Tavakoli</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Zali</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Esmaily</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Jamaldini</surname>
<given-names>S. H.</given-names>
</name>
<etal/>
</person-group> (<year>2021a</year>). <article-title>Using Machine Learning to Predict Mortality for COVID-19 Patients on Day Zero in the ICU</article-title>. <source>bioRxiv</source>. <pub-id pub-id-type="doi">10.1101/2021.02.04.21251131</pub-id> </citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jamshidi</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Babajani</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Soltani</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Niknejad</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2021b</year>). <article-title>Proposed Mechanisms of Targeting COVID-19 by Delivering Mesenchymal Stem Cells and Their Exosomes to Damaged Organs</article-title>. <source>Stem Cel Rev Rep</source> <volume>17</volume>, <fpage>176</fpage>&#x2013;<lpage>192</lpage>. <pub-id pub-id-type="doi">10.1007/s12015-020-10109-3</pub-id> </citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lalmuanawma</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Hussain</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Chhakchhuak</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Applications of Machine Learning and Artificial Intelligence for Covid-19 (SARS-CoV-2) Pandemic: A Review</article-title>. <source>Chaos, Solitons &#x26; Fractals</source>. <volume>139</volume>, <fpage>110059</fpage>. <pub-id pub-id-type="doi">10.1016/j.chaos.2020.110059</pub-id> </citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Levitsky</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Pernemalm</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Bernhardson</surname>
<given-names>B.-M.</given-names>
</name>
<name>
<surname>Forshed</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>K&#xf6;lbeck</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Olin</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Early Symptoms and Sensations as Predictors of Lung Cancer: a Machine Learning Multivariate Model</article-title>. <source>Sci. Rep.</source> <volume>9</volume>, <fpage>16504</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-019-52915-x</pub-id> </citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mandrekar</surname>
<given-names>J.&#x20;N.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Receiver Operating Characteristic Curve in Diagnostic Test Assessment</article-title>. <source>J.&#x20;Thorac. Oncol.</source> <volume>5</volume>, <fpage>1315</fpage>&#x2013;<lpage>1316</lpage>. <pub-id pub-id-type="doi">10.1097/jto.0b013e3181ec173d</pub-id> </citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pan</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Pan</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Xiao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Han</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Su</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Su</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Prognostic Assessment of COVID-19 in the Intensive Care Unit by Machine Learning Methods: Model Development and Validation</article-title>. <source>J.&#x20;Med. Internet Res.</source> <volume>22</volume>, <fpage>e23128</fpage>. <pub-id pub-id-type="doi">10.2196/23128</pub-id> </citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Persad</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Peek</surname>
<given-names>M. E.</given-names>
</name>
<name>
<surname>Emanuel</surname>
<given-names>E. J.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Fairly Prioritizing Groups for Access to COVID-19 Vaccines</article-title>. <source>JAMA</source> <volume>324</volume>, <fpage>1601</fpage>. <pub-id pub-id-type="doi">10.1001/jama.2020.18513</pub-id> </citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Snedecor</surname>
<given-names>G. W.</given-names>
</name>
</person-group> (<year>1957</year>). <article-title>Statistical Methods</article-title>. <source>Soil Sci.</source> <volume>83</volume>, <fpage>163</fpage>. <pub-id pub-id-type="doi">10.1097/00010694-195702000-00023</pub-id> </citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Qiu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Lower Mortality of COVID-19 by Early Recognition and Intervention: Experience from Jiangsu Province</article-title>. <source>Ann. Intensive Care</source>. <volume>10</volume>, <fpage>33</fpage>. <pub-id pub-id-type="doi">10.1186/s13613-020-00650-2</pub-id> </citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tabata</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Imai</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Kawano</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Ikeda</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Kodama</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Miyoshi</surname>
<given-names>K.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Clinical Characteristics of COVID-19 in 104 People with SARS-CoV-2 Infection on the Diamond Princess Cruise Ship: a Retrospective Analysis</article-title>. <source>Lancet Infect. Dis.</source> <volume>20</volume>, <fpage>1043</fpage>&#x2013;<lpage>1050</lpage>. <pub-id pub-id-type="doi">10.1016/s1473-3099(20)30482-5</pub-id> </citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vaid</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Somani</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Russak</surname>
<given-names>A. J.</given-names>
</name>
<name>
<surname>De Freitas</surname>
<given-names>J.&#x20;K.</given-names>
</name>
<name>
<surname>Chaudhry</surname>
<given-names>F. F.</given-names>
</name>
<name>
<surname>Paranjpe</surname>
<given-names>I.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Machine Learning to Predict Mortality and Critical Events in a Cohort of Patients with COVID-19 in New York City: Model Development and Validation</article-title>. <source>J.&#x20;Med. Internet Res.</source> <volume>22</volume>, <fpage>e24018</fpage>. <pub-id pub-id-type="doi">10.2196/24018</pub-id> </citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Du</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Du</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Jin</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Remdesivir in Adults with Severe COVID-19: a Randomised, Double-Blind, Placebo-Controlled, Multicentre Trial</article-title>. <source>The Lancet</source>. <volume>395</volume>, <fpage>1569</fpage>&#x2013;<lpage>1578</lpage>. <pub-id pub-id-type="doi">10.1016/s0140-6736(20)31022-9</pub-id> </citation>
</ref>
<ref id="B27">
<citation citation-type="web">
<collab>WHO</collab> (<year>2020</year>). <article-title>WHO Coronavirus Disease (COVID-19) Dashboard</article-title>. <comment>Available at: <ext-link ext-link-type="uri" xlink:href="https://covid19.who.int">https://covid19.who.int</ext-link>
</comment> (<comment>Accessed December 2, 2020</comment>) </citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wong</surname>
<given-names>T-T.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Performance Evaluation of Classification Algorithms by K-fold and Leave-One-Out Cross Validation</article-title>. <source>Pattern Recognit</source>. <volume>48</volume>, <fpage>2839</fpage>&#x2013;<lpage>2846</lpage>. <pub-id pub-id-type="doi">10.1016/j.patcog.2015.03.009</pub-id> </citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yadaw</surname>
<given-names>A. S.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Y. C.</given-names>
</name>
<name>
<surname>Bose</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Iyengar</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Bunyavanich</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Pandey</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Clinical Features of COVID-19 Mortality: Development and Validation of a Clinical Prediction Model</article-title>. <source>Lancet Digital Health</source>. <volume>2</volume>, <fpage>e516</fpage>-<lpage>e525</lpage>. <pub-id pub-id-type="doi">10.1016/S2589-7500(20)30217-X</pub-id> </citation>
</ref>
</ref-list>
</back>
</article>