<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Aging Neurosci.</journal-id>
<journal-title>Frontiers in Aging Neuroscience</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Aging Neurosci.</abbrev-journal-title>
<issn pub-type="epub">1663-4365</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fnagi.2022.945274</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Aging Neuroscience</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Develop a diagnostic tool for dementia using machine learning and non-imaging features</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Wang</surname> <given-names>Huan</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Sheng</surname> <given-names>Li</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Xu</surname> <given-names>Shanhu</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Jin</surname> <given-names>Yu</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Jin</surname> <given-names>Xiaoqing</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Qiao</surname> <given-names>Song</given-names></name>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1507397/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Chen</surname> <given-names>Qingqing</given-names></name>
<xref ref-type="aff" rid="aff4"><sup>4</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/960856/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Xing</surname> <given-names>Wenmin</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1159359/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Zhao</surname> <given-names>Zhenlei</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Yan</surname> <given-names>Jing</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1237544/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Mao</surname> <given-names>Genxiang</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<xref ref-type="corresp" rid="c002"><sup>&#x002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/1159342/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Xu</surname> <given-names>Xiaogang</given-names></name>
<xref ref-type="aff" rid="aff5"><sup>5</sup></xref>
<xref ref-type="corresp" rid="c003"><sup>&#x002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/533139/overview"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Department of Biostatistics, The George Washington University</institution>, <addr-line>Washington, DC</addr-line>, <country>United States</country></aff>
<aff id="aff2"><sup>2</sup><institution>Department of Mathematics, Drexel University</institution>, <addr-line>Philadelphia, PA</addr-line>, <country>United States</country></aff>
<aff id="aff3"><sup>3</sup><institution>Department of Neurology, Affiliated Zhejiang Hospital, Zhejiang University School of Medicine, Zhejiang University</institution>, <addr-line>Hangzhou</addr-line>, <country>China</country></aff>
<aff id="aff4"><sup>4</sup><institution>Department of Radiology, Sir Run Run Shaw Hospital, Zhejiang University School of Medicine</institution>, <addr-line>Hangzhou</addr-line>, <country>China</country></aff>
<aff id="aff5"><sup>5</sup><institution>Zhejiang Provincial Key Lab of Geriatrics &#x0026; Geriatrics Institute of Zhejiang Province, Department of Geriatrics, Affiliated Zhejiang Hospital, Zhejiang University School of Medicine, Zhejiang University</institution>, <addr-line>Hangzhou</addr-line>, <country>China</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Wenquan Zou, Case Western Reserve University, United States</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Jintang Wang, Beijing Geriatric Hospital, China; Pai-Yi Chiu, Show Chwan Memorial Hospital, Taiwan; Goo-Rak Kwon, Chosun University, South Korea</p></fn>
<corresp id="c001">&#x002A;Correspondence: Jing Yan, <email>zjicu@vip.163.com</email></corresp>
<corresp id="c002">Genxiang Mao, <email>maogenxiang@163.com</email></corresp>
<corresp id="c003">Xiaogang Xu, <email>xuxg@zju.edu.cn</email></corresp>
<fn fn-type="other" id="fn004"><p>This article was submitted to Alzheimer&#x2019;s Disease and Related Dementias, a section of the journal Frontiers in Aging Neuroscience</p></fn>
</author-notes>
<pub-date pub-type="epub">
<day>29</day>
<month>08</month>
<year>2022</year>
</pub-date>
<pub-date pub-type="collection">
<year>2022</year>
</pub-date>
<volume>14</volume>
<elocation-id>945274</elocation-id>
<history>
<date date-type="received">
<day>16</day>
<month>05</month>
<year>2022</year>
</date>
<date date-type="accepted">
<day>08</day>
<month>08</month>
<year>2022</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2022 Wang, Sheng, Xu, Jin, Jin, Qiao, Chen, Xing, Zhao, Yan, Mao and Xu.</copyright-statement>
<copyright-year>2022</copyright-year>
<copyright-holder>Wang, Sheng, Xu, Jin, Jin, Qiao, Chen, Xing, Zhao, Yan, Mao and Xu</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<sec>
<title>Background</title>
<p>Early identification of Alzheimer&#x2019;s disease or mild cognitive impairment can help guide direct prevention and supportive treatments, improve outcomes, and reduce medical costs. Existing advanced diagnostic tools are mostly based on neuroimaging and suffer from certain problems in cost, reliability, repeatability, accessibility, ease of use, and clinical integration. To address these problems, we developed, evaluated, and implemented an early diagnostic tool using machine learning and non-imaging factors.</p>
</sec>
<sec>
<title>Methods and results</title>
<p>A total of 654 participants aged 65 or older from the Nursing Home in Hangzhou, China were identified. Information collected from these patients includes dementia status and 70 demographic, cognitive, socioeconomic, and clinical features. Logistic regression, support vector machine (SVM), neural network, random forest, extreme gradient boosting (XGBoost), least absolute shrinkage and selection operator (LASSO), and best subset models were trained, tuned, and internally validated using a novel double cross validation algorithm and multiple evaluation metrics. The trained models were also compared and externally validated using a separate dataset with 1,100 participants from four communities in Zhejiang Province, China. The model with the best performance was then identified and implemented online with a friendly user interface. For the nursing dataset, the top three models are the neural network (AUROC = 0.9435), XGBoost (AUROC = 0.9398), and SVM with the polynomial kernel (AUROC = 0.9213). With the community dataset, the best three models are the random forest (AUROC = 0.9259), SVM with linear kernel (AUROC = 0.9282), and SVM with polynomial kernel (AUROC = 0.9213). The F1 scores and area under the precision-recall curve showed that the SVMs, neural network, and random forest were robust on the unbalanced community dataset. Overall the SVM with the polynomial kernel was found to be the best model. The LASSO and best subset models identified 17 features most relevant to dementia prediction, mostly from cognitive test results and socioeconomic characteristics.</p>
</sec>
<sec>
<title>Conclusion</title>
<p>Our non-imaging-based diagnostic tool can effectively predict dementia outcomes. The tool can be conveniently incorporated into clinical practice. Its online implementation allows zero barriers to its use, which enhances the disease&#x2019;s diagnosis, improves the quality of care, and reduces costs.</p>
</sec>
</abstract>
<kwd-group>
<kwd>dementia</kwd>
<kwd>Alzheimer&#x2019;s disease</kwd>
<kwd>early diagnostic tool</kwd>
<kwd>machine learning</kwd>
<kwd>non-imaging factors</kwd>
</kwd-group>
<counts>
<fig-count count="6"/>
<table-count count="3"/>
<equation-count count="0"/>
<ref-count count="64"/>
<page-count count="14"/>
<word-count count="8443"/>
</counts>
</article-meta>
</front>
<body>
<sec id="S1" sec-type="intro">
<title>Introduction</title>
<p>Dementia is a clinical syndrome of brain diseases, involving the progressive loss of memory, language, thinking and abilities of action, which seriously affects patients&#x2019; daily life and physical and mental health (<xref ref-type="bibr" rid="B44">Mitchell et al., 2009</xref>). The types of dementia are usually divided into Alzheimer&#x2019;s disease (AD), vascular dementia (VaD), frontotemporal dementia (FTD), dementia with Lewy bodies (DLB), and other dementias, of which Alzheimer&#x2019;s disease accounts for more than 60% (<xref ref-type="bibr" rid="B19">Geldmacher and Whitehouse, 1996</xref>; <xref ref-type="bibr" rid="B9">Bruun et al., 2018</xref>). Alzheimer&#x2019;s disease is a neurodegenerative disease of the nervous system associated with aging. The main features of Alzheimer&#x2019;s disease contain progressive memory impairment, visual-spatial ability, executive function impairments, amnesia, aphasia, apraxia, and agnosia, accompanied by personality and behavior changes. The amyloid beta (A&#x03B2;) in plaques, phosphorylated tau protein in neurofibrillary tangles are defining neuropathological features of AD (<xref ref-type="bibr" rid="B40">Long and Holtzman, 2019</xref>; <xref ref-type="bibr" rid="B51">Selkoe, 2019</xref>; <xref ref-type="bibr" rid="B30">Janelidze et al., 2020</xref>). With aging, the prevalence and incidence of Alzheimer&#x2019;s disease are increasing rapidly every year, which brings a heavy burden to patients, their families, and social and economic development (<xref ref-type="bibr" rid="B48">Rabins et al., 1982</xref>; <xref ref-type="bibr" rid="B5">Azevedo et al., 2021</xref>). Cognitive impairment that does not meet dementia criteria refers to mild cognitive impairment (MCI), which is consistently shown to have a high risk of progression to dementia (<xref ref-type="bibr" rid="B47">Petersen et al., 1999</xref>; <xref ref-type="bibr" rid="B21">Grundman et al., 2004</xref>). Unlike Alzheimer&#x2019;s disease patients, MCI patients have no significant effect on activities of daily work and life (<xref ref-type="bibr" rid="B17">Feldman et al., 2006</xref>).</p>
<p>Timely and accurate diagnosis of dementia is the key to the prevention and treatment of dementia. At present, the main methods used for dementia and MCI detection include clinical screening of scales, pathological tissue biopsy, and medical imaging diagnosis. Clinical screening of scales is the most common detection method used in clinical practice. This method mainly involves interactive communication between professionals and patients or patients&#x2019; family members. By objectively and comprehensively collecting information from multiple perspectives, clinical screening of scales can help make effective evaluation judgments (<xref ref-type="bibr" rid="B54">Sheehan, 2012</xref>; <xref ref-type="bibr" rid="B7">Bissig and DeCarli, 2019</xref>). Nevertheless, this method relies on the objectivity of data collection and the professional level of evaluators, and can therefore be time-consuming and expensive. Another method used in clinical and scientific studies is pathological tissue biopsy, which mainly examines biomarkers in the cerebrospinal fluid such as A&#x03B2; and Tau protein. Brain biopsies are rarely performed in clinics. The disadvantage of this approach is that its invasiveness and potential risk of complications can have a certain negative impact on the patient&#x2019;s health. In addition, even if the biopsy is negative, it does not completely rule out the possibility of dementia, because there may be lesions in other parts of the brain (<xref ref-type="bibr" rid="B61">Warren et al., 2005</xref>; <xref ref-type="bibr" rid="B33">Josephson et al., 2007</xref>; <xref ref-type="bibr" rid="B39">Leinonen et al., 2010</xref>). The third diagnostic method uses medical images, such as functional PET/MR. As an auxiliary diagnostic method, medical imaging is useful in many cases, e.g., to rule out the cognitive decline caused by secondary tumors or stroke. This method also has many limitations. First, given the high cost of equipment, not all hospitals can be equipped with corresponding testing equipment. Second, the cost of testing imposes a heavy financial burden to patients. Third, but not least, since the morphological and pathological changes in molecules and tissues may not be obvious at the early stage of the disease, imaging diagnosis often has blind spots in detection (<xref ref-type="bibr" rid="B45">Mosconi, 2013</xref>; <xref ref-type="bibr" rid="B28">Ishii, 2014</xref>; <xref ref-type="bibr" rid="B6">Barthel et al., 2015</xref>; <xref ref-type="bibr" rid="B56">Shivamurthy et al., 2015</xref>).</p>
<p>To assist and improve traditional dementia diagnosis methods, machine learning and deep learning have been increasingly applied in AD detection, especially in classifying neuroimaging data (<xref ref-type="bibr" rid="B46">Pellegrini et al., 2018</xref>; <xref ref-type="bibr" rid="B32">Jo et al., 2019</xref>). Frequently used machine learning algorithms to classify AD neuroimages include support vector machines (SVM) and artificial neural networks (ANN) (<xref ref-type="bibr" rid="B46">Pellegrini et al., 2018</xref>). With the development of deep learning techniques, the performance of deep learning models have in general surpassed that of machine learning in classifying neuroimaging data and have become the dominant method for dealing with such data. At present, the convolutional neural network (CNN) is the most widely used deep learning architecture for the diagnostic classification of AD, due to its effectiveness in dealing with imaging data (<xref ref-type="bibr" rid="B32">Jo et al., 2019</xref>). Compared with the CNN models trained from scratch in earlier years (<xref ref-type="bibr" rid="B50">Sarraf and Tofighi, 2016</xref>), most recently developed CNN models have incorporated transfer learning to make better use of small-scale datasets for better model performance (<xref ref-type="bibr" rid="B24">Hon and Khan, 2017</xref>; <xref ref-type="bibr" rid="B29">Islam and Zhang, 2017</xref>; <xref ref-type="bibr" rid="B1">Aderghal et al., 2018</xref>; <xref ref-type="bibr" rid="B15">Ding et al., 2019</xref>). The dimensions of the neural images CNN can process have also been upgraded from two to three (<xref ref-type="bibr" rid="B26">Hosseini-Asl et al., 2016</xref>; <xref ref-type="bibr" rid="B36">Khvostikov et al., 2018</xref>). In addition to CNN, some other important deep learning architectures have also been actively studied for AD diagnosis, including deep belief networks (<xref ref-type="bibr" rid="B11">Cai et al., 2016</xref>), deep auto-encoder (<xref ref-type="bibr" rid="B16">Dolph et al., 2017</xref>; <xref ref-type="bibr" rid="B55">Shi et al., 2017</xref>), recurrent neural network (<xref ref-type="bibr" rid="B14">Cui et al., 2019</xref>; <xref ref-type="bibr" rid="B38">Lee et al., 2019</xref>), etc.</p>
<p>Although neuroimaging based machine learning/deep learning algorithms have achieved a high accuracy in many AD classification tasks, these algorithms are not always the best path to build the automated AD diagnosis system for a number of reasons. First, training neuroimaging based models typically requires a large amount of high-quality labeled medical imaging, which can be a huge challenge because of the institutional barriers and the cost of collecting and labeling data. Second, due to the limitation of design, the image-based models typically cannot utilize other types of data that may contain specific information for prediction. Third, due to geographic, economic or other constraints, patients may not be able to access the established models or provide the image required by the model. Fourth, due to the complex structure or inherent &#x201C;black-box&#x201D; limitation, it is difficult to understand the relationship between selected variables and predicted results or the relative importance of each selected feature, resulting in difficulties in interpreting models and correcting potential biases arising from the training data. These problems can greatly limit models&#x2019; clinical relevance, practical application value, and the possibility of future improvement. Integration of non-imaging features (such as patient demographics, cognitive test results, clinical covariates, etc.) has been called to further advance the field of AD diagnosis (<xref ref-type="bibr" rid="B46">Pellegrini et al., 2018</xref>).</p>
<p>In this study, we explored the diagnostic effects of non-imaging features from the nursing home located in Hangzhou, Zhejiang Province, China. We employed a wide range of advanced machine learning models and validated these models in two ways: internally using a novel double cross-validation (CV) algorithm (<xref ref-type="bibr" rid="B37">Krstajic et al., 2014</xref>) and externally on a separate dataset from four communities in Zhejiang. Apart from developing predictive models, we analyzed the features that are important to the diagnosis of AD/MCI and discussed their roles in clinical practice. We also used the best-performing model to build an automated AD/MCI detection tool online. This study shows that non-imaging factors can be exploited to obtain rich predictive information and create good diagnostic models for AD/MCI. In the literature there are few studies on machine learning with non-imaging features to detect AD/MCI. <xref ref-type="bibr" rid="B52">Shankle et al. (1997)</xref> used decision tree learners, rule learners, and the Naive Bayesian classifier on the non-imaging dataset from University of California to learn the best decision rules to distinguish normal brain aging from the earliest stages of dementia. <xref ref-type="bibr" rid="B42">Maroco et al. (2011)</xref> compared 10 machine learning algorithms using several neuropsychological tests as predictors for predicting the evolution into dementia in elderly people with MCI. We note that the clinical questions investigated in these studies are different from the clinical question we studied, and that they lacked adequate internal/external valuation or online implementation. Therefore our research adds to the knowledge in this area.</p>
</sec>
<sec id="S2" sec-type="materials|methods">
<title>Materials and methods</title>
<sec id="S2.SS1">
<title>Data</title>
<p>The data were collected from the nursing home in Hangzhou, Zhejiang Province, China, between May and November 2014. Patients aged 65 or older were included and those in critical conditions were excluded. The data contain dementia status and 70 non-imaging features derived from demographic information (sex, age), cognitive tests [Mini-Cog test, clock drawing test (CDT), Mini-Mental State Exam (MMSE), and AD8 screening], socioeconomic information (education, main occupation before retirement, marital status), and clinic characteristics (past medical history, smoking status, alcohol status). Detailed definitions and demographic characteristics of the 70 features are listed in <xref ref-type="supplementary-material" rid="DS1">Supplementary Tables 1</xref>, <xref ref-type="supplementary-material" rid="DS1">2</xref>, respectively. The dementia status of patients were evaluated by experienced physicians based on the combination of the clinical diagnostic criteria for Alzheimer&#x2019;s disease, the Clinical Dementia Rating (CDR) scale, and reports from patients&#x2019; families about the patients&#x2019; daily life (e.g., memory of the way home, memory of past life, response to usual communication, etc.), and classified into three levels AD, MCI, non-AD/MCI (<xref ref-type="bibr" rid="B3">Albert et al., 2011</xref>; <xref ref-type="bibr" rid="B43">McKhann et al., 2011</xref>). To facilitate the analysis, we removed observations with missing values in cognitive status or any of the 70 features. The final nursing dataset for analysis includes 654 patients. See <xref ref-type="fig" rid="F1">Figure 1</xref> for a detailed data collection process.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption><p>Flow diagram of selecting participants from the nursing home and the communities.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fnagi-14-945274-g001.tif"/>
</fig>
<p>The nursing data were collected from the nursing home and hence were based on a population with a high risk of AD/MCI. In the final nursing dataset, 168 participants (25.7%) were diagnosed with AD, 182 (27.8%) with MCI, and 304 (46.5%) with Non-AD/MCI. It is seen that observed outcomes were roughly balanced for two classes (53.5% AD/MCI vs. 46.5% normal). Principal component analysis, a dimension reduction technique, was performed to reduce the nursing data into two-dimensional and visualize it (<xref ref-type="fig" rid="F2">Figure 2</xref>). The clusters of AD and non-AD/MCI barely overlap, while the cluster of MCI is mixed with the other two classes. This shows that three classes can present a clear pattern through non-imaging features.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption><p>Visualization of the nursing dataset after dimension reduction with principal component analysis. Black dots represent patients diagnosed with Alzheimer&#x2019;s disease (AD), red dots represent patients diagnosed with mild cognitive impairment (MCI), and green dots represent patients from neither class (non-AD/MCI).</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fnagi-14-945274-g002.tif"/>
</fig>
<p>For validation purposes, we collected data with the same cognitive status and non-imaging features from four communities across 12 counties in Zhejiang province. A multi-stage stratified random cluster sampling method was adopted to select the communities. We first divided 12 counties into four groups based on economic levels, then systematically selected one district from each of these four groups, and finally randomly chose one community from each district. The same inclusion/exclusion criteria and data processing progress as for the nursing dataset were applied (<xref ref-type="fig" rid="F1">Figure 1</xref>). The final community dataset contains 1,100 cases, of which 59 (5.4%) were diagnosed with AD, 118 (10.7%) with MCI, and 923 (83.9%) with non-AD/MCI.</p>
<p>For the collection of the nursing and community data, ethics approval was obtained from the Ethics Committee of Zhejiang Hospital and informed consents were signed by participants.</p>
</sec>
<sec id="S2.SS2">
<title>Machine learning methods</title>
<sec id="S2.SS2.SSS1">
<title>Logistic regression</title>
<p>The logistic regression (<xref ref-type="bibr" rid="B25">Hosmer et al., 2013</xref>) is a classical machine learning method widely used in medical research. It performs well if there is a linear relationship between the features and logit of the outcome. Due to the simplicity of the design, inferences regarding the contribution of each feature in predicting the outcome can be easily drawn from the model. We used this simple but powerful classification model as a benchmark: the included machine learning models should have at least as good predictive performance as the logistic model.</p>
</sec>
<sec id="S2.SS2.SSS2">
<title>Support vector machines</title>
<p>The SVM (<xref ref-type="bibr" rid="B59">Vapnik, 2013</xref>), a state-of-the-art machine learning algorithm, is a generalization of linear decision boundaries for classification. It has successful applications in a variety of medical classification tasks, e.g., diagnosing heart valve diseases (<xref ref-type="bibr" rid="B13">Comak et al., 2007</xref>), breast cancer (<xref ref-type="bibr" rid="B2">Akay, 2009</xref>), diabetes (<xref ref-type="bibr" rid="B63">Yu et al., 2010</xref>), etc. Using a kernel function, SVM can transform the data into a higher-dimensional space and construct a linear boundary in the new space while generating a non-linear boundary in the original space. In this study, we tried four different SVM models SVM_l, SVM_r, SVM_s, and SVM_p, which correspond to models obtained by using linear, radial basis, sigmoid, and polynomial kernel functions, respectively.</p>
</sec>
<sec id="S2.SS2.SSS3">
<title>Neural networks</title>
<p>Neural networks are non-linear machine learning models with computing systems inspired by how the human brain processes information. They have been widely applied in image analysis, biochemical analysis, drug design, diagnostic systems, and other branches of human medicine (<xref ref-type="bibr" rid="B4">Amato et al., 2013</xref>). Despite the low interpretability, neural networks are very flexible and quite effective in purely predictive settings thanks to the model-free design. In this study, we used a feedforward neural network with a single layer of hidden neurons and L1 weight regularization, which can be thought of as a non-linear generalization of linear logistic regression. The single-layer design and weight regularization can constrain the complexity of the model and prevent it from overfitting.</p>
</sec>
<sec id="S2.SS2.SSS4">
<title>Random forests</title>
<p>Random forests use de-correlated tree predictors to build powerful classification models (<xref ref-type="bibr" rid="B8">Breiman, 2001</xref>). By combining predictions from a large collection of individual decision trees, random forests outperform the individual tree predictor and produce more accurate predictions. Being easy to understand and effective to use, random forests have many applications in the medical field, such as predicting Alzheimer&#x2019;s and other diseases (<xref ref-type="bibr" rid="B35">Khalilia et al., 2011</xref>; <xref ref-type="bibr" rid="B20">Gray et al., 2013</xref>; <xref ref-type="bibr" rid="B34">Kane et al., 2014</xref>). In the random forest, a small number of trees will lead to poor performance of the model while a large number will not cause the model to overfit (<xref ref-type="bibr" rid="B22">Hastie et al., 2001</xref>). Therefore, we used a large number of trees, 500 in this study, to build the random forest model. In the model training process, we also assessed the importance of each feature by computing the mean decrease in Gini Index (<xref ref-type="bibr" rid="B41">Louppe et al., 2013</xref>).</p>
</sec>
<sec id="S2.SS2.SSS5">
<title>XGBoosting</title>
<p>Boosting uses a combination of many &#x201C;weak&#x201D; classifiers to generate an ultimate strong classifier (<xref ref-type="bibr" rid="B22">Hastie et al., 2001</xref>). Though less popular than SVMs and random forests, boosting can provide outstanding prediction performance (<xref ref-type="bibr" rid="B64">Zhang et al., 2017</xref>). One popular boosting algorithm is gradient boosted decision trees (GBDT) (<xref ref-type="bibr" rid="B18">Friedman, 2002</xref>), which use the decision tree as the weak learner and use the gradient descent algorithm to minimize the loss function of the model. In this paper, we implemented XGBoost (short for &#x201C;Extreme Gradient Boosting&#x201D;), one of the most efficient implementations of GBDT (<xref ref-type="bibr" rid="B12">Chen and Guestrin, 2016</xref>). Compared to GBDT, XGBoost achieves better performance by introducing the regularization term in the loss function (the model is trained by minimizing the loss function) and using a second-order Taylor approximation for the loss function.</p>
</sec>
<sec id="S2.SS2.SSS6">
<title>The least absolute shrinkage and selection operator</title>
<p>To better understand the relationship between features and outcome variables, we employed the least absolute shrinkage and selection operator (LASSO) (<xref ref-type="bibr" rid="B58">Tibshirani, 1996</xref>), which allows automatic feature selection by adding an L1 regularization term to force coefficients of some features to be equal to zero. LASSO is a popular and arguably the most effective method for selecting features in a linear model (<xref ref-type="bibr" rid="B23">Hastie et al., 2017</xref>). It is especially useful when there is a need to analyze a large number of features. We implemented LASSO as a prediction model for AD/MCI. And we investigated the contribution of features to the outcome prediction by examining the coefficient paths of the model.</p>
</sec>
<sec id="S2.SS2.SSS7">
<title>Best subset</title>
<p>Best subset selection is another approach to finding the most relevant features to predict the outcome of interest. By definition, it requires evaluating possible subsets of the collection of all features according to some criteria. Although this approach has unmatched advantages in terms of interpretability, it is computationally demanding when the number of features is large and is computationally infeasible when cross-validation is used to evaluate subsets. In this study, we used a two-step search strategy to approximate the optimal result of best subset selection and reduce the computational requirement: (1) for each <italic>S</italic> = 1,2,&#x2026;,<italic>P</italic>, find the &#x201C;best&#x201D; <italic>S</italic> out of <italic>P</italic> features, where the best features here refer to the ones that can maximize the likelihood function of the logistic regression model (achieved by the &#x201C;BeSS.ONE&#x201D; function in the BeSS R package; <xref ref-type="bibr" rid="B62">Wen et al., 2017</xref>), (2) find the best number of <italic>S</italic> (achieved by regarding <italic>S</italic> as a parameter and tuning it with double CV).</p>
</sec>
</sec>
<sec id="S2.SS3">
<title>Evaluation metrics and validation methods</title>
<p>We performed both internal and external validation for all proposed machine learning models. The performance of all models was then assessed and compared according to sensitivity (recall), specificity, accuracy, area under the receiver operating characteristic curve (AUROC), precision, F1-score, and area under the precision-recall curve (AUPRC). Note that AUROC summarizes the trade-off between sensitivity and specificity while the F1-score (harmonic mean of the precision and recall) and AUPRC summarize the trade-off between sensitivity and precision.</p>
<p>We trained and internally evaluated our proposed machine learning models on the nursing dataset. The nursing dataset (350 cases) was relatively small compared to the 70 features and complex machine learning models we selected. Splitting the dataset into training, validation, and test sets allows parameter tuning. However, this method does not yield reliable estimates because of the small test set. On the other hand, the traditional <italic>k</italic>-fold CV can lead to over-optimistic estimates of the model&#x2019;s performance (<xref ref-type="bibr" rid="B60">Varma and Simon, 2006</xref>). Therefore, we considered a novel double CV that can take care of both model evaluation and parameter tuning (<xref ref-type="bibr" rid="B37">Krstajic et al., 2014</xref>). To perform the double CV, we divided the nursing dataset into 10 folds and performed the following for each model. (1) Left one fold for validation. (2) On the remaining 9 folds, performed a 10-fold CV to tune the parameters so that the optimal parameters maximized the average AUROC. (3) Used the optimal parameters to refit the model on the 9-folds. (4) Computed evaluation metrics for the model fitted in step (3) on the held-out fold in step (1). (5) Repeated steps (1)&#x2013;(4) 10 times across the 10 folds of the nursing dataset to obtain the 10 sets of evaluation metrics and optimal parameters. The performance of each model evaluated internally on the nursing dataset was then represented by the average of 10 sets of evaluation metrics, i.e., the double CV metrics. The process of performing double CV is illustrated in <xref ref-type="fig" rid="F3">Figure 3</xref>.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption><p>Flowchart of the double cross-validation.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fnagi-14-945274-g003.tif"/>
</fig>
<p>After internal validation, we performed an external validation for the models. The medians of 10 sets of optimal parameters from the double CV were used to train the final models on the whole nursing dataset. Then the evaluation metrics of each final model were computed on the community dataset.</p>
</sec>
<sec id="S2.SS4">
<title>Parameter optimization</title>
<p>In the inner loop of double CV, different parameter tuning methods were applied to different models. Logistic regression has no parameters to be tuned. Grid search was used in double CV to fine-tune the parameters in the four SVM models, neural network, random forest, LASSO, and best subset model. For the last two models, tuning parameters (L1 regularization parameter in LASSO and number of features &#x201C;<italic>S</italic>&#x201D; in the best subset) is effectively equivalent to performing feature selection. The XGBoost model contains many important parameters (e.g., learning rate, maximum depth of a tree, number of trees, etc.) and requires extensive tuning to reach the desired performance. To address this, we used the Gaussian process upper confidence bound (GP-UCB) algorithm (<xref ref-type="bibr" rid="B57">Srinivas et al., 2009</xref>) in the double CV to tune the parameters. GP-UCB is a popular Bayesian optimization algorithm that chooses parameters by controlling the exploration-exploitation tradeoffs.</p>
</sec>
<sec id="S2.SS5">
<title>Software</title>
<p>All statistical analyses were done in R (R version 3.6.2) using the following libraries: e1071, randomForest, nnet, NeuralNetTools, xgboost, rBayesianOptimization, glmnet, BeSS, ROCR, cutpointr, ggplot2, and their respective dependencies. The online screening tool was employed by using R Shiny.</p>
</sec>
</sec>
<sec id="S3" sec-type="results">
<title>Results</title>
<sec id="S3.SS1">
<title>Models&#x2019; evaluation and comparison</title>
<p>We have applied a number of different machine learning algorithms to build prediction models for detecting AD/MCI. It is of interest to compare these methods and determine which one performed best.</p>
<p><xref ref-type="table" rid="T1">Table 1</xref> compares demographic characteristics of age, sex, education, and summary scores of cognitive tests across the normal, MCI, and AD groups. <xref ref-type="table" rid="T2">Table 2</xref> reports the classification performance of each model evaluated internally by the double CV on the nursing dataset. The averages of the 10 values of sensitivity, specificity, accuracy, and AUROC in the outer loop of double CV were provided. It can be seen that the SVM_r model had the best sensitivity while the SVM_p had the best specificity. The SVM_p and LASSO had the best accuracy performance. The Neural network (<xref ref-type="fig" rid="F4">Figure 4</xref>) achieved the best AUROC, followed by XGBoost and SVM_p.</p>
<table-wrap position="float" id="T1">
<label>TABLE 1</label>
<caption><p>Demographic characteristics of age, sex, education, and summary scores of cognitive tests across the normal, MCI, and AD groups.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left"></td>
<td valign="top" align="center" colspan="4">Nursing dataset<hr/></td>
<td valign="top" align="center" colspan="4">Community dataset<hr/></td>
</tr>
<tr>
<td valign="top" align="left"/><td valign="top" align="center">AD</td>
<td valign="top" align="center">MCI</td>
<td valign="top" align="center">Non-AD/MCI</td>
<td valign="top" align="center">Overall</td>
<td valign="top" align="center">AD</td>
<td valign="top" align="center">MCI</td>
<td valign="top" align="center">Non-AD/MCI</td>
<td valign="top" align="center">Overall</td>
</tr>
<tr>
<td valign="top" align="left"/><td valign="top" align="center">(<italic>N</italic> = 168)</td>
<td valign="top" align="center">(<italic>N</italic> = 182)</td>
<td valign="top" align="center">(<italic>N</italic> = 304)</td>
<td valign="top" align="center">(<italic>N</italic> = 654)</td>
<td valign="top" align="center">(<italic>N</italic> = 59)</td>
<td valign="top" align="center">(<italic>N</italic> = 118)</td>
<td valign="top" align="center">(<italic>N</italic> = 923)</td>
<td valign="top" align="center">(<italic>N</italic> = 1,100)</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left"><bold>Sex</bold></td>
<td valign="top" align="center"/><td valign="top" align="center"/><td valign="top" align="center"/><td valign="top" align="center"/><td valign="top" align="center"/><td valign="top" align="center"/><td valign="top" align="center"/><td valign="top" align="center"/></tr>
<tr>
<td valign="top" align="left">Male</td>
<td valign="top" align="center">52 (31.0%)</td>
<td valign="top" align="center">63 (34.6%)</td>
<td valign="top" align="center">114 (37.5%)</td>
<td valign="top" align="center">229 (35.0%)</td>
<td valign="top" align="center">30 (50.8%)</td>
<td valign="top" align="center">48 (40.7%)</td>
<td valign="top" align="center">448 (48.5%)</td>
<td valign="top" align="center">526 (47.8%)</td>
</tr>
<tr>
<td valign="top" align="left">Female</td>
<td valign="top" align="center">116 (69.0%)</td>
<td valign="top" align="center">119 (65.4%)</td>
<td valign="top" align="center">190 (62.5%)</td>
<td valign="top" align="center">425 (65.0%)</td>
<td valign="top" align="center">29 (49.2%)</td>
<td valign="top" align="center">70 (59.3%)</td>
<td valign="top" align="center">475 (51.5%)</td>
<td valign="top" align="center">574 (52.2%)</td>
</tr>
<tr>
<td valign="top" align="left"><bold>Age</bold> (SD)</td>
<td valign="top" align="center">85 (&#x00B1; 6.4)</td>
<td valign="top" align="center">85 (&#x00B1; 5.6)</td>
<td valign="top" align="center">82 (&#x00B1; 6.4)</td>
<td valign="top" align="center">84 (&#x00B1; 6.3)</td>
<td valign="top" align="center">80 (&#x00B1; 5.4)</td>
<td valign="top" align="center">79 (&#x00B1; 5.7)</td>
<td valign="top" align="center">75 (&#x00B1; 6.2)</td>
<td valign="top" align="center">76 (&#x00B1; 6.3)</td>
</tr>
<tr>
<td valign="top" align="left"><bold>Education</bold> (SD)</td>
<td valign="top" align="center">2.3 (&#x00B1; 1.3)</td>
<td valign="top" align="center">2.7 (&#x00B1; 1.3)</td>
<td valign="top" align="center">3.4 (&#x00B1; 1.4)</td>
<td valign="top" align="center">2.9 (&#x00B1; 1.4)</td>
<td valign="top" align="center">2.4 (&#x00B1; 1.2)</td>
<td valign="top" align="center">2.9 (&#x00B1; 1.1)</td>
<td valign="top" align="center">3.4 (&#x00B1; 1.2)</td>
<td valign="top" align="center">3.3 (&#x00B1; 1.2)</td>
</tr>
<tr>
<td valign="top" align="left"><bold>Summary score of mini-cog test</bold> (SD)</td>
<td valign="top" align="center">1.0 (&#x00B1; 1.1)</td>
<td valign="top" align="center">2.1 (&#x00B1; 1.2)</td>
<td valign="top" align="center">3.2 (&#x00B1; 0.88)</td>
<td valign="top" align="center">2.3 (&#x00B1; 1.4)</td>
<td valign="top" align="center">2.1 (&#x00B1; 1.2)</td>
<td valign="top" align="center">2.6 (&#x00B1; 1.2)</td>
<td valign="top" align="center">3.6 (&#x00B1; 0.69)</td>
<td valign="top" align="center">3.4 (&#x00B1; 0.90)</td>
</tr>
<tr>
<td valign="top" align="left"><bold>Summary score of clock drawing test</bold> (SD)</td>
<td valign="top" align="center">0.98 (&#x00B1; 1.4)</td>
<td valign="top" align="center">2.4 (&#x00B1; 1.8)</td>
<td valign="top" align="center">4.2 (&#x00B1; 1.3)</td>
<td valign="top" align="center">2.9 (&#x00B1; 2.0)</td>
<td valign="top" align="center">3.1 (&#x00B1; 1.6)</td>
<td valign="top" align="center">3.9 (&#x00B1; 1.3)</td>
<td valign="top" align="center">4.7 (&#x00B1; 0.70)</td>
<td valign="top" align="center">4.6 (&#x00B1; 0.95)</td>
</tr>
<tr>
<td valign="top" align="left"><bold>Summary score of mini-mental state exam</bold> (SD)</td>
<td valign="top" align="center">13 (&#x00B1; 6.6)</td>
<td valign="top" align="center">22 (&#x00B1; 4.3)</td>
<td valign="top" align="center">27 (&#x00B1; 2.6)</td>
<td valign="top" align="center">22 (&#x00B1; 7.2)</td>
<td valign="top" align="center">21 (&#x00B1; 4.7)</td>
<td valign="top" align="center">24 (&#x00B1; 3.8)</td>
<td valign="top" align="center">28 (&#x00B1; 2.2)</td>
<td valign="top" align="center">28 (&#x00B1; 3.2)</td>
</tr>
<tr>
<td valign="top" align="left"><bold>Summary score of AD8 screening</bold> (SD)</td>
<td valign="top" align="center">4.3 (&#x00B1; 2.6)</td>
<td valign="top" align="center">2.1 (&#x00B1; 1.8)</td>
<td valign="top" align="center">0.80 (&#x00B1; 1.1)</td>
<td valign="top" align="center">2.1 (&#x00B1; 2.3)</td>
<td valign="top" align="center">4.3 (&#x00B1; 2.2)</td>
<td valign="top" align="center">3.8 (&#x00B1; 2.0)</td>
<td valign="top" align="center">1.7 (&#x00B1; 1.1)</td>
<td valign="top" align="center">2.0 (&#x00B1; 1.5)</td>
</tr>
</tbody>
</table></table-wrap>
<table-wrap position="float" id="T2">
<label>TABLE 2</label>
<caption><p>Classification performance of each model evaluated internally by the double CV on the nursing dataset.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left">Method</td>
<td valign="top" align="center">Sensitivity</td>
<td valign="top" align="center">Specitivity</td>
<td valign="top" align="center">Accuracy</td>
<td valign="top" align="center">AUROC</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Logistic regression</td>
<td valign="top" align="center">0.8229</td>
<td valign="top" align="center">0.8289</td>
<td valign="top" align="center">0.8256</td>
<td valign="top" align="center">0.9068</td>
</tr>
<tr>
<td valign="top" align="left">SVM_l</td>
<td valign="top" align="center">0.8143</td>
<td valign="top" align="center">0.8453</td>
<td valign="top" align="center">0.8287</td>
<td valign="top" align="center">0.9127</td>
</tr>
<tr>
<td valign="top" align="left">SVM_r</td>
<td valign="top" align="center">0.8600</td>
<td valign="top" align="center">0.8455</td>
<td valign="top" align="center">0.8532</td>
<td valign="top" align="center">0.9287</td>
</tr>
<tr>
<td valign="top" align="left">SVM_s</td>
<td valign="top" align="center">0.8200</td>
<td valign="top" align="center">0.8976</td>
<td valign="top" align="center">0.8562</td>
<td valign="top" align="center">0.9374</td>
</tr>
<tr>
<td valign="top" align="left">SVM_p</td>
<td valign="top" align="center">0.8343</td>
<td valign="top" align="center">0.8947</td>
<td valign="top" align="center">0.8624</td>
<td valign="top" align="center">0.9378</td>
</tr>
<tr>
<td valign="top" align="left">Neural network</td>
<td valign="top" align="center">0.8429</td>
<td valign="top" align="center">0.8751</td>
<td valign="top" align="center">0.8578</td>
<td valign="top" align="center">0.9435</td>
</tr>
<tr>
<td valign="top" align="left">Random forest</td>
<td valign="top" align="center">0.8314</td>
<td valign="top" align="center">0.8618</td>
<td valign="top" align="center">0.8455</td>
<td valign="top" align="center">0.9340</td>
</tr>
<tr>
<td valign="top" align="left">XGBoost</td>
<td valign="top" align="center">0.8457</td>
<td valign="top" align="center">0.8552</td>
<td valign="top" align="center">0.8501</td>
<td valign="top" align="center">0.9398</td>
</tr>
<tr>
<td valign="top" align="left">LASSO</td>
<td valign="top" align="center">0.8400</td>
<td valign="top" align="center">0.8882</td>
<td valign="top" align="center">0.8624</td>
<td valign="top" align="center">0.9341</td>
</tr>
<tr>
<td valign="top" align="left">Best subset</td>
<td valign="top" align="center">0.8371</td>
<td valign="top" align="center">0.8553</td>
<td valign="top" align="center">0.8456</td>
<td valign="top" align="center">0.9141</td>
</tr>
</tbody>
</table></table-wrap>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption><p>The final neural network model. Weights are color-coded by sign (blue+, gray&#x2212;) and thickness is in proportion to magnitude. Input features include sex, age, Mini-Cog test (c1&#x2013;c2), Clock Drawing test (d1&#x2013;d5), Mini-Mental State exam (e11&#x2013;e15, e21&#x2013;e25, e31&#x2013;e33, e41&#x2013;e45, e51&#x2013;e53, e61&#x2013;e62, e7, e8, e91&#x2013;e93, e10, e16), AD8 screening (f1&#x2013;f8), education (h1), occupation (h22&#x2013;h29), marital status (h32&#x2013;h35, h37), past medical history (h61&#x2013;66), number of medications (h8), smoking (h9), and drinking (h10).</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fnagi-14-945274-g004.tif"/>
</fig>
<p><xref ref-type="table" rid="T3">Table 3</xref> reports the classification performance of each model evaluated externally on the community dataset. Compared to the nursing dataset, the community data were collected at households and were based on a population with a low risk of AD/MCI. The observed outcomes were quite unbalanced between the two classes (16.1% AD/MCI vs. 83.9% normal). Therefore, in addition to sensitivity, specificity, accuracy, and AUROC, we recorded the metrics of precision, F1-score, and AUPRC as these metrics are especially useful for the unbalanced data. From <xref ref-type="table" rid="T3">Table 3</xref>, we can see that the SVM_r and SVM_p have the best accuracy. SVM_l, SVM_p, and random forest models are the top three models in terms of AUROC (&#x003E; 0.92). The SVM_r and SVM_p models had the highest F1-scores while logistic regression, XGBoost, and best subset models had poor F1-scores. The AUPRC values of SVM models, neural network, and random forest were relatively high, while those of the remaining models were relatively low.</p>
<table-wrap position="float" id="T3">
<label>TABLE 3</label>
<caption><p>Classification performance of each model evaluated externally on the community dataset.</p></caption>
<table cellspacing="5" cellpadding="5" frame="hsides" rules="groups">
<thead>
<tr>
<td valign="top" align="left">Method</td>
<td valign="top" align="center">Sensitivity</td>
<td valign="top" align="center">Specitivity</td>
<td valign="top" align="center">Accuracy</td>
<td valign="top" align="center">AUROC</td>
<td valign="top" align="center">Precision</td>
<td valign="top" align="center">F1-score</td>
<td valign="top" align="center">AUPRC</td>
</tr>
</thead>
<tbody>
<tr>
<td valign="top" align="left">Logistic regression</td>
<td valign="top" align="center">0.6215</td>
<td valign="top" align="center">0.8895</td>
<td valign="top" align="center">0.8464</td>
<td valign="top" align="center">0.8435</td>
<td valign="top" align="center">0.5189</td>
<td valign="top" align="center">0.5656</td>
<td valign="top" align="center">0.5199</td>
</tr>
<tr>
<td valign="top" align="left">SVM_l</td>
<td valign="top" align="center">0.5763</td>
<td valign="top" align="center">0.9458</td>
<td valign="top" align="center">0.8864</td>
<td valign="top" align="center">0.9282</td>
<td valign="top" align="center">0.6711</td>
<td valign="top" align="center">0.6201</td>
<td valign="top" align="center">0.6652</td>
</tr>
<tr>
<td valign="top" align="left">SVM_r</td>
<td valign="top" align="center">0.6102</td>
<td valign="top" align="center">0.9404</td>
<td valign="top" align="center">0.8873</td>
<td valign="top" align="center">0.9137</td>
<td valign="top" align="center">0.6626</td>
<td valign="top" align="center">0.6353</td>
<td valign="top" align="center">0.6395</td>
</tr>
<tr>
<td valign="top" align="left">SVM_s</td>
<td valign="top" align="center">0.5650</td>
<td valign="top" align="center">0.9437</td>
<td valign="top" align="center">0.8827</td>
<td valign="top" align="center">0.9177</td>
<td valign="top" align="center">0.6579</td>
<td valign="top" align="center">0.6079</td>
<td valign="top" align="center">0.6560</td>
</tr>
<tr>
<td valign="top" align="left">SVM_p</td>
<td valign="top" align="center">0.6045</td>
<td valign="top" align="center">0.9415</td>
<td valign="top" align="center">0.8873</td>
<td valign="top" align="center">0.9213</td>
<td valign="top" align="center">0.6646</td>
<td valign="top" align="center">0.6331</td>
<td valign="top" align="center">0.6549</td>
</tr>
<tr>
<td valign="top" align="left">Neural network</td>
<td valign="top" align="center">0.5876</td>
<td valign="top" align="center">0.9426</td>
<td valign="top" align="center">0.8855</td>
<td valign="top" align="center">0.9139</td>
<td valign="top" align="center">0.6624</td>
<td valign="top" align="center">0.6228</td>
<td valign="top" align="center">0.6513</td>
</tr>
<tr>
<td valign="top" align="left">Random forest</td>
<td valign="top" align="center">0.5706</td>
<td valign="top" align="center">0.9437</td>
<td valign="top" align="center">0.8836</td>
<td valign="top" align="center">0.9259</td>
<td valign="top" align="center">0.6601</td>
<td valign="top" align="center">0.6121</td>
<td valign="top" align="center">0.6623</td>
</tr>
<tr>
<td valign="top" align="left">XGBoost</td>
<td valign="top" align="center">0.5424</td>
<td valign="top" align="center">0.9415</td>
<td valign="top" align="center">0.8773</td>
<td valign="top" align="center">0.9006</td>
<td valign="top" align="center">0.6400</td>
<td valign="top" align="center">0.5872</td>
<td valign="top" align="center">0.6323</td>
</tr>
<tr>
<td valign="top" align="left">LASSO</td>
<td valign="top" align="center">0.5932</td>
<td valign="top" align="center">0.9393</td>
<td valign="top" align="center">0.8836</td>
<td valign="top" align="center">0.9023</td>
<td valign="top" align="center">0.6522</td>
<td valign="top" align="center">0.6213</td>
<td valign="top" align="center">0.6284</td>
</tr>
<tr>
<td valign="top" align="left">Best subset</td>
<td valign="top" align="center">0.4859</td>
<td valign="top" align="center">0.9274</td>
<td valign="top" align="center">0.8564</td>
<td valign="top" align="center">0.8483</td>
<td valign="top" align="center">0.5621</td>
<td valign="top" align="center">0.5212</td>
<td valign="top" align="center">0.5432</td>
</tr>
</tbody>
</table></table-wrap>
<p>Though, according to <xref ref-type="table" rid="T2">Tables 2</xref>, <xref ref-type="table" rid="T3">3</xref>, no model appears to be superior to all other models by all evaluation metrics, we can find some clues based on the accuracy and AUROC. The accuracy is the most common and intuitive metric to compare models&#x2019; performance. SVM_p and LASSO have the best accuracy in the internal validation (balanced data) while SVM_r and SVM_p have the best accuracy in the external validation (imbalanced data). According to this metric, the SVM and LASSO models seem to be the best models. However, we must note that accuracies have flaws in comparing models&#x2019; overall performance. First, the metric is limited to a single decision threshold (0.5 in this study), with which the model&#x2019;s prediction probability is compared to determine whether the outcome prediction is positive or negative. Second, the metric cannot be used to compare models that are built upon datasets with different outcome distributions. Third, the metric can be misleading on classification problems with a skewed class distribution. For example, the accuracy on a dataset with 10% positive cases can be at least 90% accurate.</p>
<p>Compared to the accuracy, AUROC is a more robust and informative evaluation metric as it summarizes the sensitivity and specificity across different decision thresholds and can be used to compare models on different (possibly skewed) outcome distributions. On the nursing dataset, the neural network, Xgboost, SVM_p have the highest AUROC values (<xref ref-type="fig" rid="F5">Figure 5A</xref>). However, the neural network and Xgboost have a low AUROC on the community dataset (<xref ref-type="fig" rid="F5">Figure 5B</xref>). On the community dataset, the SVM_l, random forest, and SVM_p were the top models in terms of AUROC, while the first two models had less performance than the third model on the nursing dataset. It can be seen that SVM_p is the only one performing well on both the nursing (balanced) and the community (unbalanced) datasets.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption><p>ROC and PRC curves for the machine learning models for detecting dementia. <bold>(A)</bold> Mean ROC curves for the models on the nursing datasets. Each curve represents the mean ROC curve from the outer loop of the double cross validation. <bold>(B)</bold> ROC curves for the models on the community data. <bold>(C)</bold> PRC curves for the models on the community data.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fnagi-14-945274-g005.tif"/>
</fig>
<p>While ROC can be used for skewed outcome distributions, it may mask poor performance under unbalanced data (<xref ref-type="bibr" rid="B31">Jeni et al., 2013</xref>). F1 score and AUPRC, two metrics based on precision, are useful for the unbalanced setting since precision is an informative measure under imbalanced data (<xref ref-type="bibr" rid="B49">Saito and Rehmsmeier, 2015</xref>). We examined F1-score and AUPRC on the community dataset to rule out underperforming models on these two metrics. It can be seen that SVM_p has relatively high scores on these two measures (<xref ref-type="fig" rid="F5">Figure 5C</xref>), which again confirms that SVM_p is robust on the unbalanced data. Through the above analysis, we concluded that overall SVM_p is the best AD/MCI detection model. We had implemented SVM_p online for patients and healthcare professionals to access (R Shiny).<sup><xref ref-type="fn" rid="footnote1">1</xref></sup></p>
<p>In terms of AUROC, our SVM_p is one of the best-performing models in predicting dementia to date (<xref ref-type="bibr" rid="B27">Hou et al., 2019</xref>). While most published models relied on a small number of features and few reported (proper) validation results (<xref ref-type="bibr" rid="B46">Pellegrini et al., 2018</xref>; <xref ref-type="bibr" rid="B27">Hou et al., 2019</xref>), our models took advantage of 70 features and went through both internal (double cross) validation and external validation.</p>
<p>Therefore, our study made maximum use of the information from available features while ensuring the reliability and repeatability of the results.</p>
</sec>
<sec id="S3.SS2">
<title>Features&#x2019; contribution</title>
<p>Some of the machine learning models we built enabled us to see the contribution of the features for predicting AD/MCI. We studied the relative importance of features by the tree-based random forests and XGBoost models and further investigated the role of the important features by the Lasso model and the best subset model.</p>
<p>In the random forest model, the Gini index is used to decide which feature to split at each node within each component tree classifier. Each split of a node results in a decrease in Gini where the magnitude of the decrease indicates the discriminatory power of the split. For each feature, the decrease in the Gini index is accumulated each time the feature is selected to split a node. Therefore, the average decrease over all component tree classifiers for each feature can be used to represent the contribution of this feature to the prediction and thus serve as a measure of importance. A greater mean decrease means higher importance. Based on information gain, a measure similar to the mean decrease in Gini, the XGBoost can also compute each feature&#x2019;s contribution to the model using all the splits.</p>
<p><xref ref-type="supplementary-material" rid="DS1">Supplementary Figure 1A</xref> presents the 20 most important features based on the final random forest model. It can be seen that the tests of counting down from 100 by 7 (e41-e45) and clocking drawing (d1-d5) are of most importance for predicting outcome. Mini-Cog test (c1-c2), time orientation test (e11-e15), and age have a lower level of importance. Of less importance is the test of copy drawing (e16), the test of repeating phrase (e7), the test of repeating previous items (e51-e53), medications (h8), and others. The feature importance rankings given by the XGBoost model are similar to those given by the random forest (<xref ref-type="supplementary-material" rid="DS1">Supplementary Figure 1B</xref>), while the former highlights the importance of education (h1), and AD8 Dementia Screening (f1-f8), and the test of saying a complete sentence (e10).</p>
<p>To understand the specific impact of important features, we also studied the features selected by the LASSO and best subset model and analyzed the signs of the features&#x2019; coefficients. In the final LASSO model, the L1 regularization shrunk the coefficients of less important features to zero. There were 35 features considered by LASSO to be relevant to outcome prediction (<xref ref-type="supplementary-material" rid="DS1">Supplementary Figures 2A,B</xref>). In contrast, the best subset model selected 19 features (<xref ref-type="supplementary-material" rid="DS1">Supplementary Figure 2C</xref>), almost all of which are included in the features selected by LASSO. These results show that many non-imaging features could help predict AD/MCI.</p>
<p>Specifically, 17 were selected by both LASSO and best subset. These features were most likely to be relevant to AD/MCI prediction, including age, Mini-Cog test (c2), clocking drawing test (d2, d5), time orientation test (e15), address orientation test (e23), the test of counting down from 100 by 7 (e43, e44), the test of repeating previous items (e51, e52), the test of repeating previous items (e7), the test of saying a complete sentence (e10), AD8 Dementia Screening (f6, f8), education (h1), &#x201C;cadres staff&#x201D; in the occupation (h24), and &#x201C;married&#x201D; in the marital status (h32). For these 17 features, LASSO and the best subset agreed on the signs of their coefficients. These signs allow us to further understand the influence of the features on predicting the disease. From <xref ref-type="supplementary-material" rid="DS1">Supplementary Figure 2B</xref>, it can be seen that the coefficients of all test-related features were negative, which is reasonable since passing the test indicates a lower likelihood of developing AD/MCI. &#x201C;Married&#x201D; (compared to &#x201C;single&#x201D;) in the marital status also suggests a lower risk. On the other hand, age, &#x201C;handling complex personal financial matters&#x201D; (f6) and &#x201C;daily memory and thinking&#x201D; (f8) in AD8 screening, education, and &#x201C;cadres staff&#x201D; (compared to &#x201C;worker&#x201D;) in the occupation (h24) have positive coefficients, suggesting that these features are risk indicators.</p>
<p>In the nursing dataset, if we only look at education without considering other features, then education is negatively associated with ADI/MCI (<xref ref-type="fig" rid="F6">Figure 6A</xref>). But this relationship is reversed when other features are taken into account (<xref ref-type="supplementary-material" rid="DS1">Supplementary Figures 2B,C</xref>). These results of education echo the findings that the role of education can be controversial in predicting the risk of dementia (<xref ref-type="bibr" rid="B10">Caama&#x00F1;o-Isorna et al., 2006</xref>; <xref ref-type="bibr" rid="B53">Sharp and Gatz, 2011</xref>). Instead of being an independent risk factor, education could be a factor that protects against or delays the clinical manifestations of dementia. In other words, patients with a severe brain damage and a high educational level may present similar clinical symptoms of the disease as those with a less severe brain damage and a lower educational level. This view can also be confirmed by the results in <xref ref-type="fig" rid="F6">Figure 6B</xref> where education is highly positively correlated with cognitive abilities (Mini-Cog, Clock Drawing, MMSE) and negatively correlated with cognitive problems (AD8 Screening features). Therefore, our model in fact suggests that a higher educational level may mean more severe brain damage if cognitive levels are equal.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption><p>The role of education in predicting dementia. <bold>(A)</bold> The marginal distribution of the levels of education on the nursing dataset. <bold>(B)</bold> The correlation coefficients between education and other features on the nursing dataset.</p></caption>
<graphic mimetype="image" mime-subtype="tiff" xlink:href="fnagi-14-945274-g006.tif"/>
</fig>
</sec>
</sec>
<sec id="S4" sec-type="discussion">
<title>Discussion</title>
<p>We created and validated our AD/MCI diagnostic tool using extensive data collected from the nursing home and the communities. These data are readily available and closely related to clinical diagnosis, which makes our model highly applicable. The applicability of our tool is further enhanced by its online deployment. Patients and clinicians who do not understand machine learning algorithms can easily input the collected non-imaging features into our tool to obtain timely predictive results. Compared to the traditional clinical screening of scales, our approach simplifies the data collection task and quickly performs high-quality analysis, thus greatly improving the diagnostic efficiency of clinicians. In addition, our approach does not involve any risk of complications associated with invasive biopsies, nor rely on equipment and operators for medical imaging systems. These merits make our approach almost free of test costs or risk of use, therefore avoiding economic or health impacts on patients and their families. We believe it has great potential applications, especially in small cities and rural areas.</p>
</sec>
<sec id="S5" sec-type="conclusion">
<title>Conclusion</title>
<p>Automated diagnostic tools have become crucial in the diagnosis of dementia. Although neuro-images have been heavily used in recently developed tools, traditional non-imaging features can effectively diagnose dementia and conveniently incorporate clinical practice. We used a large number of non-imaging features and machine learning to create a highly performing dementia diagnostic tool. Our work leverages the predictive potential of non-imaging features and significantly lowers the barriers for using the diagnostic tool. We believe this study will have a direct impact on physicians&#x2019; diagnostic practice and patients&#x2019; self-screening.</p>
</sec>
<sec id="S6" sec-type="data-availability">
<title>Data availability statement</title>
<p>The original contributions presented in this study are included in the article/<xref ref-type="supplementary-material" rid="DS1">Supplementary material</xref>, further inquiries can be directed to the corresponding authors.</p>
</sec>
<sec id="S7">
<title>Author contributions</title>
<p>XX, HW, JY, and GM conceived and designed the study. SX, YJ, XJ, and SQ collected the data. HW, XX, LS, and QC performed data analysis. HW, XX, WX, and ZZ made the figures. HW and XX wrote the manuscript. All authors reviewed, approved the final version of the manuscript, and agreed to be accountable for the content of the work.</p>
</sec>
</body>
<back>
<sec id="S8" sec-type="funding-information">
<title>Funding</title>
<p>This study was supported by funds from the Zhejiang Province Basic Public Welfare Research Project (LGF21H250002), Chinese Traditional Medicine Science and Technology Projects of Zhejiang Province (2021ZB002 and 2022ZB002), and Health Bureau of Zhejiang Province (2019RC092 and 2020KY394).</p>
</sec>
<sec id="S9" sec-type="COI-statement">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec id="S10" sec-type="disclaimer">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="S11" sec-type="supplementary-material">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fnagi.2022.945274/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fnagi.2022.945274/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Data_Sheet_1.docx" id="DS1" mimetype="application/vnd.openxmlformats-officedocument.wordprocessingml.document" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<glossary>
<title>Abbreviations</title>
<def-list id="DL1">
<def-item><term>MCI</term><def><p>mild cognitive impairment</p></def></def-item>
<def-item><term>A&#x03B2;</term><def><p>amyloid beta</p></def></def-item>
<def-item><term>VaD</term><def><p>vascular dementia</p></def></def-item>
<def-item><term>FTD</term><def><p>frontotemporal dementia</p></def></def-item>
<def-item><term>DLB</term><def><p>dementia with Lewy bodies</p></def></def-item>
<def-item><term>SVM</term><def><p>support vector machine</p></def></def-item>
<def-item><term>XGBoost</term><def><p>extreme gradient boosting</p></def></def-item>
<def-item><term>LASSO</term><def><p>least absolute shrinkage and selection operator</p></def></def-item>
<def-item><term>ANN</term><def><p>artificial neural networks</p></def></def-item>
<def-item><term>CV</term><def><p>cross-validation</p></def></def-item>
<def-item><term>CDT</term><def><p>clock drawing test</p></def></def-item>
<def-item><term>MMSE</term><def><p>Mini-Mental State Exam</p></def></def-item>
<def-item><term>CDR</term><def><p>clinical dementia rating</p></def></def-item>
<def-item><term>GBDT</term><def><p>gradient boosted decision trees</p></def></def-item>
<def-item><term>AUROC</term><def><p>area under the receiver operating characteristic curve</p></def></def-item>
<def-item><term>AUPRC</term><def><p>area under the precision-recall curve</p></def></def-item>
<def-item><term>GP-UCB</term><def><p>Gaussian process upper confidence bound.</p></def></def-item>
</def-list>
</glossary>
<fn-group>
<fn id="footnote1">
<label>1</label>
<p><ext-link ext-link-type="uri" xlink:href="https://hwmachinelearning.shinyapps.io/Dementia/">https://hwmachinelearning.shinyapps.io/Dementia/</ext-link></p></fn>
</fn-group>
<ref-list>
<title>References</title>
<ref id="B1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Aderghal</surname> <given-names>K.</given-names></name> <name><surname>Khvostikov</surname> <given-names>A.</given-names></name> <name><surname>Krylov</surname> <given-names>A.</given-names></name> <name><surname>Benois-Pineau</surname> <given-names>J.</given-names></name> <name><surname>Afdel</surname> <given-names>K.</given-names></name> <name><surname>Catheline</surname> <given-names>G.</given-names></name></person-group> (<year>2018</year>). &#x201C;<article-title>Classification of Alzheimer disease on imaging modalities with deep CNNs using cross-modal transfer learning</article-title>,&#x201D; in <source><italic>2018 IEEE 31st International Symposium on Computer-Based Medical Systems (CBMS)</italic></source>, (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>IEEE</publisher-name>), <fpage>345</fpage>&#x2013;<lpage>350</lpage>. <pub-id pub-id-type="doi">10.1109/CBMS.2018.00067</pub-id></citation></ref>
<ref id="B2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Akay</surname> <given-names>M. F.</given-names></name></person-group> (<year>2009</year>). <article-title>Support vector machines combined with feature selection for breast cancer diagnosis.</article-title> <source><italic>Expert Syst. Appl.</italic></source> <volume>36</volume> <fpage>3240</fpage>&#x2013;<lpage>3247</lpage>. <pub-id pub-id-type="doi">10.1016/j.eswa.2008.01.009</pub-id></citation></ref>
<ref id="B3"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Albert</surname> <given-names>M. S.</given-names></name> <name><surname>DeKosky</surname> <given-names>S. T.</given-names></name> <name><surname>Dickson</surname> <given-names>D.</given-names></name> <name><surname>Dubois</surname> <given-names>B.</given-names></name> <name><surname>Feldman</surname> <given-names>H. H.</given-names></name> <name><surname>Fox</surname> <given-names>N. C.</given-names></name><etal/></person-group> (<year>2011</year>). <article-title>The diagnosis of mild cognitive impairment due to Alzheimer&#x2019;s disease: Recommendations from the National Institute on Aging-Alzheimer&#x2019;s Association workgroups on diagnostic guidelines for Alzheimer&#x2019;s disease.</article-title> <source><italic>Alzheimers Dement.</italic></source> <volume>7</volume> <fpage>270</fpage>&#x2013;<lpage>279</lpage>. <pub-id pub-id-type="doi">10.1016/j.jalz.2011.03.008</pub-id> <pub-id pub-id-type="pmid">21514249</pub-id></citation></ref>
<ref id="B4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Amato</surname> <given-names>F.</given-names></name> <name><surname>L&#x00F3;pez</surname> <given-names>A.</given-names></name> <name><surname>Pe&#x00F1;a-M&#x00E9;ndez</surname> <given-names>E. M.</given-names></name> <name><surname>Va&#x0148;hara</surname> <given-names>P.</given-names></name> <name><surname>Hampl</surname> <given-names>A.</given-names></name> <name><surname>Havel</surname> <given-names>J.</given-names></name></person-group> (<year>2013</year>). <source><italic>Artificial Neural Networks in Medical Diagnosis.</italic></source> <publisher-loc>Amsterdam</publisher-loc>: <publisher-name>Elsevier</publisher-name>. <pub-id pub-id-type="doi">10.2478/v10136-012-0031-x</pub-id></citation></ref>
<ref id="B5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Azevedo</surname> <given-names>L.</given-names></name> <name><surname>Calandri</surname> <given-names>I. L.</given-names></name> <name><surname>Slachevsky</surname> <given-names>A.</given-names></name> <name><surname>Graviotto</surname> <given-names>H. G.</given-names></name> <name><surname>Vieira</surname> <given-names>M. C. S.</given-names></name> <name><surname>Andrade</surname> <given-names>C. B.</given-names></name><etal/></person-group> (<year>2021</year>). <article-title>Impact of Social Isolation on People with Dementia and Their Family Caregivers.</article-title> <source><italic>J. Alzheimers Dis.</italic></source> <volume>81</volume> <fpage>607</fpage>&#x2013;<lpage>617</lpage>. <pub-id pub-id-type="doi">10.3233/JAD-201580</pub-id> <pub-id pub-id-type="pmid">33814446</pub-id></citation></ref>
<ref id="B6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Barthel</surname> <given-names>H.</given-names></name> <name><surname>Schroeter</surname> <given-names>M. L.</given-names></name> <name><surname>Hoffmann</surname> <given-names>K. T.</given-names></name> <name><surname>Sabri</surname> <given-names>O.</given-names></name></person-group> (<year>2015</year>). <article-title>PET/MR in dementia and other neurodegenerative diseases.</article-title> <source><italic>Semin. Nucl. Med.</italic></source> <volume>45</volume> <fpage>224</fpage>&#x2013;<lpage>233</lpage>. <pub-id pub-id-type="doi">10.1053/j.semnuclmed.2014.12.003</pub-id> <pub-id pub-id-type="pmid">25841277</pub-id></citation></ref>
<ref id="B7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bissig</surname> <given-names>D.</given-names></name> <name><surname>DeCarli</surname> <given-names>C. S.</given-names></name></person-group> (<year>2019</year>). <article-title>Global &#x0026; Community Health: Brief in-hospital cognitive screening anticipates complex admissions and may detect dementia.</article-title> <source><italic>Neurology</italic></source> <volume>92</volume> <fpage>631</fpage>&#x2013;<lpage>634</lpage>. <pub-id pub-id-type="doi">10.1212/WNL.0000000000007176</pub-id> <pub-id pub-id-type="pmid">30910941</pub-id></citation></ref>
<ref id="B8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Breiman</surname> <given-names>L.</given-names></name></person-group> (<year>2001</year>). <article-title>Random forests.</article-title> <source><italic>Mach. Learn.</italic></source> <volume>45</volume> <fpage>5</fpage>&#x2013;<lpage>32</lpage>. <pub-id pub-id-type="doi">10.1023/A:1010933404324</pub-id></citation></ref>
<ref id="B9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bruun</surname> <given-names>M.</given-names></name> <name><surname>Rhodius-Meester</surname> <given-names>H. F. M.</given-names></name> <name><surname>Koikkalainen</surname> <given-names>J.</given-names></name> <name><surname>Baroni</surname> <given-names>M.</given-names></name> <name><surname>Gjerum</surname> <given-names>L.</given-names></name> <name><surname>Lemstra</surname> <given-names>A. W.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>Evaluating combinations of diagnostic tests to discriminate different dementia types.</article-title> <source><italic>Alzheimers Dement.</italic></source> <volume>10</volume> <fpage>509</fpage>&#x2013;<lpage>518</lpage>. <pub-id pub-id-type="doi">10.1016/j.dadm.2018.07.003</pub-id> <pub-id pub-id-type="pmid">30320203</pub-id></citation></ref>
<ref id="B10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Caama&#x00F1;o-Isorna</surname> <given-names>F.</given-names></name> <name><surname>Corral</surname> <given-names>M.</given-names></name> <name><surname>Montes-Mart&#x00ED;nez</surname> <given-names>A.</given-names></name> <name><surname>Takkouche</surname> <given-names>B.</given-names></name></person-group> (<year>2006</year>). <article-title>Education and dementia: A meta-analytic study.</article-title> <source><italic>Neuroepidemiology</italic></source> <volume>26</volume> <fpage>226</fpage>&#x2013;<lpage>232</lpage>. <pub-id pub-id-type="doi">10.1159/000093378</pub-id> <pub-id pub-id-type="pmid">16707907</pub-id></citation></ref>
<ref id="B11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cai</surname> <given-names>H.</given-names></name> <name><surname>Sha</surname> <given-names>X.</given-names></name> <name><surname>Han</surname> <given-names>X.</given-names></name> <name><surname>Wei</surname> <given-names>S.</given-names></name> <name><surname>Hu</surname> <given-names>B.</given-names></name></person-group> (<year>2016</year>). &#x201C;<article-title>Pervasive EEG diagnosis of depression using Deep Belief Network with three-electrodes EEG collector</article-title>,&#x201D; in <source><italic>2016 IEEE International Conference on Bioinformatics and Biomedicine (BIBM)</italic></source>, (<publisher-loc>Amsterdam</publisher-loc>: <publisher-name>IEEE</publisher-name>), <fpage>1239</fpage>&#x2013;<lpage>1246</lpage>.</citation></ref>
<ref id="B12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>T.</given-names></name> <name><surname>Guestrin</surname> <given-names>C.</given-names></name></person-group> (<year>2016</year>). &#x201C;<article-title>Xgboost: A scalable tree boosting system</article-title>,&#x201D; in <source><italic>Proceedings of the 22nd ACM Sigkdd International Conference on Knowledge Discovery and Data Mining</italic></source>, (<publisher-loc>New York, NY</publisher-loc>: <publisher-name>Association for Computing Machinery</publisher-name>). <fpage>785</fpage>&#x2013;<lpage>794</lpage>. <pub-id pub-id-type="doi">10.1145/2939672.2939785</pub-id></citation></ref>
<ref id="B13"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Comak</surname> <given-names>E.</given-names></name> <name><surname>Arslan</surname> <given-names>A.</given-names></name> <name><surname>Turkoglu</surname> <given-names>I.</given-names></name></person-group> (<year>2007</year>). <article-title>A decision support system based on support vector machines for diagnosis of the heart valve diseases.</article-title> <source><italic>Comput. Biol. Med.</italic></source> <volume>37</volume> <fpage>21</fpage>&#x2013;<lpage>27</lpage>. <pub-id pub-id-type="doi">10.1016/j.compbiomed.2005.11.002</pub-id> <pub-id pub-id-type="pmid">16426598</pub-id></citation></ref>
<ref id="B14"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cui</surname> <given-names>R.</given-names></name> <name><surname>Liu</surname> <given-names>M.</given-names></name> <name><surname>Alzheimer&#x2019;s Disease Neuroimaging</surname> <given-names>I.</given-names></name></person-group> (<year>2019</year>). <article-title>RNN-based longitudinal analysis for diagnosis of Alzheimer&#x2019;s disease.</article-title> <source><italic>Comput. Med. Imaging Graph.</italic></source> <volume>73</volume> <fpage>1</fpage>&#x2013;<lpage>10</lpage>. <pub-id pub-id-type="doi">10.1016/j.compmedimag.2019.01.005</pub-id> <pub-id pub-id-type="pmid">30763637</pub-id></citation></ref>
<ref id="B15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ding</surname> <given-names>Y.</given-names></name> <name><surname>Sohn</surname> <given-names>J. H.</given-names></name> <name><surname>Kawczynski</surname> <given-names>M. G.</given-names></name> <name><surname>Trivedi</surname> <given-names>H.</given-names></name> <name><surname>Harnish</surname> <given-names>R.</given-names></name> <name><surname>Jenkins</surname> <given-names>N. W.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>A Deep Learning Model to Predict a Diagnosis of Alzheimer Disease by Using (18)F-FDG PET of the Brain.</article-title> <source><italic>Radiology</italic></source> <volume>290</volume> <fpage>456</fpage>&#x2013;<lpage>464</lpage>. <pub-id pub-id-type="doi">10.1148/radiol.2018180958</pub-id> <pub-id pub-id-type="pmid">30398430</pub-id></citation></ref>
<ref id="B16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dolph</surname> <given-names>C. V.</given-names></name> <name><surname>Alam</surname> <given-names>M.</given-names></name> <name><surname>Shboul</surname> <given-names>Z.</given-names></name> <name><surname>Samad</surname> <given-names>M. D.</given-names></name> <name><surname>Iftekharuddin</surname> <given-names>K. M.</given-names></name></person-group> (<year>2017</year>). &#x201C;<article-title>Deep learning of texture and structural features for multiclass Alzheimer&#x2019;s disease classification</article-title>,&#x201D; in <source><italic>2017 International Joint Conference on Neural Networks (IJCNN)</italic></source>, (<publisher-loc>Amsterdam</publisher-loc>: <publisher-name>IEEE</publisher-name>), <fpage>2259</fpage>&#x2013;<lpage>2266</lpage>. <pub-id pub-id-type="doi">10.1109/IJCNN.2017.7966129</pub-id></citation></ref>
<ref id="B17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Feldman</surname> <given-names>H.</given-names></name> <name><surname>Ganguli</surname> <given-names>M.</given-names></name> <name><surname>Hampel</surname> <given-names>H.</given-names></name> <name><surname>Scheltens</surname> <given-names>P.</given-names></name> <name><surname>Tierney</surname> <given-names>M. C.</given-names></name> <name><surname>Whitehouse</surname> <given-names>P.</given-names></name><etal/></person-group> (<year>2006</year>). <article-title>International Psychogeriatric Association Expert Conference on mild cognitive impairment. Mild cognitive impairment.</article-title> <source><italic>Lancet</italic></source> <volume>367</volume> <fpage>1262</fpage>&#x2013;<lpage>1270</lpage>. <pub-id pub-id-type="doi">10.1016/S0140-6736(06)68542-5</pub-id></citation></ref>
<ref id="B18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Friedman</surname> <given-names>J. H.</given-names></name></person-group> (<year>2002</year>). <article-title>Stochastic gradient boosting.</article-title> <source><italic>Comput. Stat. Data Anal.</italic></source> <volume>38</volume> <fpage>367</fpage>&#x2013;<lpage>378</lpage>. <pub-id pub-id-type="doi">10.1016/S0167-9473(01)00065-2</pub-id></citation></ref>
<ref id="B19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Geldmacher</surname> <given-names>D. S.</given-names></name> <name><surname>Whitehouse</surname> <given-names>P. J.</given-names></name></person-group> (<year>1996</year>). <article-title>Evaluation of dementia.</article-title> <source><italic>N. Engl. J. Med.</italic></source> <volume>335</volume> <fpage>330</fpage>&#x2013;<lpage>336</lpage>. <pub-id pub-id-type="doi">10.1056/NEJM199608013350507</pub-id> <pub-id pub-id-type="pmid">8663868</pub-id></citation></ref>
<ref id="B20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gray</surname> <given-names>K. R.</given-names></name> <name><surname>Aljabar</surname> <given-names>P.</given-names></name> <name><surname>Heckemann</surname> <given-names>R. A.</given-names></name> <name><surname>Hammers</surname> <given-names>A.</given-names></name> <name><surname>Rueckert</surname> <given-names>D.</given-names></name> <name><surname>Initiative</surname> <given-names>A. S. D. N.</given-names></name></person-group> (<year>2013</year>). <article-title>Random forest-based similarity measures for multi-modal classification of Alzheimer&#x2019;s disease.</article-title> <source><italic>NeuroImage</italic></source> <volume>65</volume> <fpage>167</fpage>&#x2013;<lpage>175</lpage>. <pub-id pub-id-type="doi">10.1016/j.neuroimage.2012.09.065</pub-id> <pub-id pub-id-type="pmid">23041336</pub-id></citation></ref>
<ref id="B21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Grundman</surname> <given-names>M.</given-names></name> <name><surname>Petersen</surname> <given-names>R. C.</given-names></name> <name><surname>Ferris</surname> <given-names>S. H.</given-names></name> <name><surname>Thomas</surname> <given-names>R. G.</given-names></name> <name><surname>Aisen</surname> <given-names>P. S.</given-names></name> <name><surname>Bennett</surname> <given-names>D. A.</given-names></name><etal/></person-group> (<year>2004</year>). <article-title>Mild cognitive impairment can be distinguished from Alzheimer disease and normal aging for clinical trials.</article-title> <source><italic>Arch. Neurol.</italic></source> <volume>61</volume> <fpage>59</fpage>&#x2013;<lpage>66</lpage>. <pub-id pub-id-type="doi">10.1001/archneur.61.1.59</pub-id> <pub-id pub-id-type="pmid">14732621</pub-id></citation></ref>
<ref id="B22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hastie</surname> <given-names>T.</given-names></name> <name><surname>Tibshirani</surname> <given-names>R.</given-names></name> <name><surname>Friedman</surname> <given-names>J.</given-names></name></person-group> (<year>2001</year>). <source><italic>The Elements of Statistical Learning. Springer Series in Statistics.</italic></source> <publisher-loc>Germany</publisher-loc>: <publisher-name>Springer</publisher-name>. <pub-id pub-id-type="doi">10.1007/978-0-387-21606-5</pub-id></citation></ref>
<ref id="B23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hastie</surname> <given-names>T.</given-names></name> <name><surname>Tibshirani</surname> <given-names>R.</given-names></name> <name><surname>Tibshirani</surname> <given-names>R. J.</given-names></name></person-group> (<year>2017</year>). <article-title>Extended comparisons of best subset selection, forward stepwise selection, and the lasso.</article-title> <source><italic>arXiv.</italic></source> [<comment>Preprint</comment>].</citation></ref>
<ref id="B24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hon</surname> <given-names>M.</given-names></name> <name><surname>Khan</surname> <given-names>N. M.</given-names></name></person-group> (<year>2017</year>). &#x201C;<article-title>Towards Alzheimer&#x2019;s disease classification through transfer learning</article-title>,&#x201D; in <source><italic>2017 IEEE International Conference on Bioinformatics and Biomedicine (BIBM)</italic></source>, (<publisher-loc>Amsterdam</publisher-loc>: <publisher-name>IEEE</publisher-name>), <fpage>1166</fpage>&#x2013;<lpage>1169</lpage>. <pub-id pub-id-type="doi">10.1109/BIBM.2017.8217822</pub-id></citation></ref>
<ref id="B25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hosmer</surname> <given-names>D. W.</given-names> <suffix>Jr.</suffix></name> <name><surname>Lemeshow</surname> <given-names>S.</given-names></name> <name><surname>Sturdivant</surname> <given-names>R. X.</given-names></name></person-group> (<year>2013</year>). <source><italic>Applied Logistic Regression.</italic></source> <publisher-loc>Hoboken</publisher-loc>: <publisher-name>John Wiley &#x0026; Sons.</publisher-name> <pub-id pub-id-type="doi">10.1002/9781118548387</pub-id></citation></ref>
<ref id="B26"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hosseini-Asl</surname> <given-names>E.</given-names></name> <name><surname>Keynton</surname> <given-names>R.</given-names></name> <name><surname>El-Baz</surname> <given-names>A.</given-names></name></person-group> (<year>2016</year>). &#x201C;<article-title>Alzheimer&#x2019;s disease diagnostics by adaptation of 3D convolutional network</article-title>,&#x201D; in <source><italic>2016 IEEE International Conference on Image Processing (ICIP)</italic></source>, (<publisher-loc>Amsterdam</publisher-loc>: <publisher-name>IEEE</publisher-name>), <fpage>126</fpage>&#x2013;<lpage>130</lpage>. <pub-id pub-id-type="doi">10.1109/ICIP.2016.7532332</pub-id></citation></ref>
<ref id="B27"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hou</surname> <given-names>X.-H.</given-names></name> <name><surname>Feng</surname> <given-names>L.</given-names></name> <name><surname>Zhang</surname> <given-names>C.</given-names></name> <name><surname>Cao</surname> <given-names>X.-P.</given-names></name> <name><surname>Tan</surname> <given-names>L.</given-names></name> <name><surname>Yu</surname> <given-names>J.-T.</given-names></name></person-group> (<year>2019</year>). <article-title>Models for predicting risk of dementia: A systematic review.</article-title> <source><italic>J. Neurol. Neurosurg. Psychiatry</italic></source> <volume>90</volume> <fpage>373</fpage>&#x2013;<lpage>379</lpage>. <pub-id pub-id-type="doi">10.1136/jnnp-2018-318212</pub-id> <pub-id pub-id-type="pmid">29954871</pub-id></citation></ref>
<ref id="B28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ishii</surname> <given-names>K.</given-names></name></person-group> (<year>2014</year>). <article-title>PET approaches for diagnosis of dementia.</article-title> <source><italic>AJNR Am. J. Neuroradiol.</italic></source> <volume>35</volume> <fpage>2030</fpage>&#x2013;<lpage>2038</lpage>. <pub-id pub-id-type="doi">10.3174/ajnr.A3695</pub-id> <pub-id pub-id-type="pmid">23945233</pub-id></citation></ref>
<ref id="B29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Islam</surname> <given-names>J.</given-names></name> <name><surname>Zhang</surname> <given-names>Y.</given-names></name></person-group> (<year>2017</year>). &#x201C;<article-title>A novel deep learning based multi-class classification method for Alzheimer&#x2019;s disease detection using brain MRI data</article-title>,&#x201D; in <source><italic>International Conference on Brain Informatics</italic></source>, (<publisher-loc>Germany</publisher-loc>: <publisher-name>Springer</publisher-name>), <fpage>213</fpage>&#x2013;<lpage>222</lpage>. <pub-id pub-id-type="doi">10.1007/978-3-319-70772-3_20</pub-id></citation></ref>
<ref id="B30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Janelidze</surname> <given-names>S.</given-names></name> <name><surname>Mattsson</surname> <given-names>N.</given-names></name> <name><surname>Palmqvist</surname> <given-names>S.</given-names></name> <name><surname>Smith</surname> <given-names>R.</given-names></name> <name><surname>Beach</surname> <given-names>T. G.</given-names></name> <name><surname>Serrano</surname> <given-names>G. E.</given-names></name><etal/></person-group> (<year>2020</year>). <article-title>Plasma P-tau181 in Alzheimer&#x2019;s disease: Relationship to other biomarkers, differential diagnosis, neuropathology and longitudinal progression to Alzheimer&#x2019;s dementia.</article-title> <source><italic>Nat. Med.</italic></source> <volume>26</volume> <fpage>379</fpage>&#x2013;<lpage>386</lpage>. <pub-id pub-id-type="doi">10.1038/s41591-020-0755-1</pub-id> <pub-id pub-id-type="pmid">32123385</pub-id></citation></ref>
<ref id="B31"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jeni</surname> <given-names>L. A.</given-names></name> <name><surname>Cohn</surname> <given-names>J. F.</given-names></name> <name><surname>De La Torre</surname> <given-names>F.</given-names></name></person-group> (<year>2013</year>). &#x201C;<article-title>Facing imbalanced data&#x2013;recommendations for the use of performance metrics</article-title>,&#x201D; in <source><italic>2013 Humaine Association Conference on Affective Computing and Intelligent Interaction</italic></source>, (<publisher-loc>Amsterdam</publisher-loc>: <publisher-name>IEEE</publisher-name>), <fpage>245</fpage>&#x2013;<lpage>251</lpage>. <pub-id pub-id-type="doi">10.1109/ACII.2013.47</pub-id> <pub-id pub-id-type="pmid">25574450</pub-id></citation></ref>
<ref id="B32"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Jo</surname> <given-names>T.</given-names></name> <name><surname>Nho</surname> <given-names>K.</given-names></name> <name><surname>Saykin</surname> <given-names>A. J.</given-names></name></person-group> (<year>2019</year>). <article-title>Deep Learning in Alzheimer&#x2019;s Disease: Diagnostic Classification and Prognostic Prediction Using Neuroimaging Data.</article-title> <source><italic>Front. Aging Neurosci.</italic></source> <volume>11</volume>:<fpage>220</fpage>. <pub-id pub-id-type="doi">10.3389/fnagi.2019.00220</pub-id> <pub-id pub-id-type="pmid">31481890</pub-id></citation></ref>
<ref id="B33"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Josephson</surname> <given-names>S. A.</given-names></name> <name><surname>Papanastassiou</surname> <given-names>A. M.</given-names></name> <name><surname>Berger</surname> <given-names>M. S.</given-names></name> <name><surname>Barbaro</surname> <given-names>N. M.</given-names></name> <name><surname>McDermott</surname> <given-names>M. W.</given-names></name> <name><surname>Hilton</surname> <given-names>J. F.</given-names></name><etal/></person-group> (<year>2007</year>). <article-title>The diagnostic utility of brain biopsy procedures in patients with rapidly deteriorating neurological conditions or dementia.</article-title> <source><italic>J. Neurosurg.</italic></source> <volume>106</volume> <fpage>72</fpage>&#x2013;<lpage>75</lpage>. <pub-id pub-id-type="doi">10.3171/jns.2007.106.1.72</pub-id> <pub-id pub-id-type="pmid">17236490</pub-id></citation></ref>
<ref id="B34"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kane</surname> <given-names>M. J.</given-names></name> <name><surname>Price</surname> <given-names>N.</given-names></name> <name><surname>Scotch</surname> <given-names>M.</given-names></name> <name><surname>Rabinowitz</surname> <given-names>P.</given-names></name></person-group> (<year>2014</year>). <article-title>Comparison of ARIMA and Random Forest time series models for prediction of avian influenza H5N1 outbreaks.</article-title> <source><italic>BMC Bioinformatics</italic></source> <volume>15</volume>:<fpage>276</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2105-15-276</pub-id> <pub-id pub-id-type="pmid">25123979</pub-id></citation></ref>
<ref id="B35"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Khalilia</surname> <given-names>M.</given-names></name> <name><surname>Chakraborty</surname> <given-names>S.</given-names></name> <name><surname>Popescu</surname> <given-names>M.</given-names></name></person-group> (<year>2011</year>). <article-title>Predicting disease risks from highly imbalanced data using random forest.</article-title> <source><italic>BMC Med. Inform. Decis. Mak.</italic></source> <volume>11</volume>:<fpage>51</fpage>. <pub-id pub-id-type="doi">10.1186/1472-6947-11-51</pub-id> <pub-id pub-id-type="pmid">21801360</pub-id></citation></ref>
<ref id="B36"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Khvostikov</surname> <given-names>A.</given-names></name> <name><surname>Aderghal</surname> <given-names>K.</given-names></name> <name><surname>Benois-Pineau</surname> <given-names>J.</given-names></name> <name><surname>Krylov</surname> <given-names>A.</given-names></name> <name><surname>Catheline</surname> <given-names>G.</given-names></name></person-group> (<year>2018</year>). <article-title>3D CNN-based classification using sMRI and MD-DTI images for Alzheimer disease studies.</article-title> <source><italic>arXiv</italic></source> [<comment>Preprint</comment>].</citation></ref>
<ref id="B37"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Krstajic</surname> <given-names>D.</given-names></name> <name><surname>Buturovic</surname> <given-names>L. J.</given-names></name> <name><surname>Leahy</surname> <given-names>D. E.</given-names></name> <name><surname>Thomas</surname> <given-names>S.</given-names></name></person-group> (<year>2014</year>). <article-title>Cross-validation pitfalls when selecting and assessing regression and classification models.</article-title> <source><italic>J. Cheminform.</italic></source> <volume>6</volume>:<fpage>10</fpage>. <pub-id pub-id-type="doi">10.1186/1758-2946-6-10</pub-id> <pub-id pub-id-type="pmid">24678909</pub-id></citation></ref>
<ref id="B38"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lee</surname> <given-names>G.</given-names></name> <name><surname>Nho</surname> <given-names>K.</given-names></name> <name><surname>Kang</surname> <given-names>B.</given-names></name> <name><surname>Sohn</surname> <given-names>K. A.</given-names></name> <name><surname>Kim</surname> <given-names>D.</given-names></name> <name><surname>for Alzheimer&#x2019;s Disease Neuroimaging</surname> <given-names>I.</given-names></name></person-group> (<year>2019</year>). <article-title>Predicting Alzheimer&#x2019;s disease progression using multi-modal deep learning approach.</article-title> <source><italic>Sci. Rep.</italic></source> <volume>9</volume>:<fpage>1952</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-018-37769-z</pub-id> <pub-id pub-id-type="pmid">30760848</pub-id></citation></ref>
<ref id="B39"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Leinonen</surname> <given-names>V.</given-names></name> <name><surname>Koivisto</surname> <given-names>A. M.</given-names></name> <name><surname>Savolainen</surname> <given-names>S.</given-names></name> <name><surname>Rummukainen</surname> <given-names>J.</given-names></name> <name><surname>Tamminen</surname> <given-names>J. N.</given-names></name> <name><surname>Tillgren</surname> <given-names>T.</given-names></name><etal/></person-group> (<year>2010</year>). <article-title>Amyloid and tau proteins in cortical brain biopsy and Alzheimer&#x2019;s disease.</article-title> <source><italic>Ann. Neurol.</italic></source> <volume>68</volume> <fpage>446</fpage>&#x2013;<lpage>453</lpage>. <pub-id pub-id-type="doi">10.1002/ana.22100</pub-id> <pub-id pub-id-type="pmid">20976765</pub-id></citation></ref>
<ref id="B40"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Long</surname> <given-names>J. M.</given-names></name> <name><surname>Holtzman</surname> <given-names>D. M.</given-names></name></person-group> (<year>2019</year>). <article-title>Alzheimer Disease: An Update on Pathobiology and Treatment Strategies.</article-title> <source><italic>Cell</italic></source> <volume>179</volume> <fpage>312</fpage>&#x2013;<lpage>339</lpage>. <pub-id pub-id-type="doi">10.1016/j.cell.2019.09.001</pub-id> <pub-id pub-id-type="pmid">31564456</pub-id></citation></ref>
<ref id="B41"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Louppe</surname> <given-names>G.</given-names></name> <name><surname>Wehenkel</surname> <given-names>L.</given-names></name> <name><surname>Sutera</surname> <given-names>A.</given-names></name> <name><surname>Geurts</surname> <given-names>P.</given-names></name></person-group> (<year>2013</year>). <article-title>Understanding variable importances in forests of randomized trees.</article-title> <source><italic>Adv. Neural. Inf. Process. Syst.</italic></source> <volume>26</volume> <fpage>431</fpage>&#x2013;<lpage>439</lpage>.</citation></ref>
<ref id="B42"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Maroco</surname> <given-names>J.</given-names></name> <name><surname>Silva</surname> <given-names>D.</given-names></name> <name><surname>Rodrigues</surname> <given-names>A.</given-names></name> <name><surname>Guerreiro</surname> <given-names>M.</given-names></name> <name><surname>Santana</surname> <given-names>I.</given-names></name> <name><surname>de Mendon&#x00E7;a</surname> <given-names>A.</given-names></name></person-group> (<year>2011</year>). <article-title>Data mining methods in the prediction of Dementia: A real-data comparison of the accuracy, sensitivity and specificity of linear discriminant analysis, logistic regression, neural networks, support vector machines, classification trees and random forests.</article-title> <source><italic>BMC Res. Notes</italic></source> <volume>4</volume>:<fpage>299</fpage>. <pub-id pub-id-type="doi">10.1186/1756-0500-4-299</pub-id> <pub-id pub-id-type="pmid">21849043</pub-id></citation></ref>
<ref id="B43"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>McKhann</surname> <given-names>G. M.</given-names></name> <name><surname>Knopman</surname> <given-names>D. S.</given-names></name> <name><surname>Chertkow</surname> <given-names>H.</given-names></name> <name><surname>Hyman</surname> <given-names>B. T.</given-names></name> <name><surname>Jack</surname> <given-names>C. R.</given-names> <suffix>Jr.</suffix></name> <name><surname>Kawas</surname> <given-names>C. H.</given-names></name><etal/></person-group> (<year>2011</year>). <article-title>The diagnosis of dementia due to Alzheimer&#x2019;s disease: Recommendations from the National Institute on Aging-Alzheimer&#x2019;s Association workgroups on diagnostic guidelines for Alzheimer&#x2019;s disease.</article-title> <source><italic>Alzheimers Dement.</italic></source> <volume>7</volume> <fpage>263</fpage>&#x2013;<lpage>269</lpage>. <pub-id pub-id-type="doi">10.1016/j.jalz.2011.03.005</pub-id> <pub-id pub-id-type="pmid">21514250</pub-id></citation></ref>
<ref id="B44"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mitchell</surname> <given-names>S. L.</given-names></name> <name><surname>Teno</surname> <given-names>J. M.</given-names></name> <name><surname>Kiely</surname> <given-names>D. K.</given-names></name> <name><surname>Shaffer</surname> <given-names>M. L.</given-names></name> <name><surname>Jones</surname> <given-names>R. N.</given-names></name> <name><surname>Prigerson</surname> <given-names>H. G.</given-names></name><etal/></person-group> (<year>2009</year>). <article-title>The clinical course of advanced dementia.</article-title> <source><italic>N. Engl. J. Med.</italic></source> <volume>361</volume> <fpage>1529</fpage>&#x2013;<lpage>1538</lpage>. <pub-id pub-id-type="doi">10.1056/NEJMoa0902234</pub-id> <pub-id pub-id-type="pmid">19828530</pub-id></citation></ref>
<ref id="B45"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mosconi</surname> <given-names>L.</given-names></name></person-group> (<year>2013</year>). <article-title>Glucose metabolism in normal aging and Alzheimer&#x2019;s disease: Methodological and physiological considerations for PET studies.</article-title> <source><italic>Clin. Transl. Imaging</italic></source> <volume>1</volume>:<fpage>10</fpage>. <pub-id pub-id-type="doi">10.1007/s40336-013-0026-y</pub-id> <pub-id pub-id-type="pmid">24409422</pub-id></citation></ref>
<ref id="B46"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Pellegrini</surname> <given-names>E.</given-names></name> <name><surname>Ballerini</surname> <given-names>L.</given-names></name> <name><surname>Hernandez</surname> <given-names>M.</given-names></name> <name><surname>Chappell</surname> <given-names>F. M.</given-names></name> <name><surname>Gonzalez-Castro</surname> <given-names>V.</given-names></name> <name><surname>Anblagan</surname> <given-names>D.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>Machine learning of neuroimaging for assisted diagnosis of cognitive impairment and dementia: A systematic review.</article-title> <source><italic>Alzheimers Dement.</italic></source> <volume>10</volume> <fpage>519</fpage>&#x2013;<lpage>535</lpage>. <pub-id pub-id-type="doi">10.1016/j.dadm.2018.07.004</pub-id> <pub-id pub-id-type="pmid">30364671</pub-id></citation></ref>
<ref id="B47"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Petersen</surname> <given-names>R. C.</given-names></name> <name><surname>Smith</surname> <given-names>G. E.</given-names></name> <name><surname>Waring</surname> <given-names>S. C.</given-names></name> <name><surname>Ivnik</surname> <given-names>R. J.</given-names></name> <name><surname>Tangalos</surname> <given-names>E. G.</given-names></name> <name><surname>Kokmen</surname> <given-names>E.</given-names></name></person-group> (<year>1999</year>). <article-title>Mild cognitive impairment: Clinical characterization and outcome.</article-title> <source><italic>Arch. Neurol.</italic></source> <volume>56</volume> <fpage>303</fpage>&#x2013;<lpage>308</lpage>. <pub-id pub-id-type="doi">10.1001/archneur.56.3.303</pub-id> <pub-id pub-id-type="pmid">10190820</pub-id></citation></ref>
<ref id="B48"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rabins</surname> <given-names>P. V.</given-names></name> <name><surname>Mace</surname> <given-names>N. L.</given-names></name> <name><surname>Lucas</surname> <given-names>M. J.</given-names></name></person-group> (<year>1982</year>). <article-title>The impact of dementia on the family.</article-title> <source><italic>JAMA</italic></source> <volume>248</volume> <fpage>333</fpage>&#x2013;<lpage>335</lpage>. <pub-id pub-id-type="doi">10.1001/jama.1982.03330030039022</pub-id></citation></ref>
<ref id="B49"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Saito</surname> <given-names>T.</given-names></name> <name><surname>Rehmsmeier</surname> <given-names>M.</given-names></name></person-group> (<year>2015</year>). <article-title>The precision-recall plot is more informative than the ROC plot when evaluating binary classifiers on imbalanced datasets.</article-title> <source><italic>PLoS One</italic></source> <volume>10</volume>:<fpage>e0118432</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0118432</pub-id> <pub-id pub-id-type="pmid">25738806</pub-id></citation></ref>
<ref id="B50"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sarraf</surname> <given-names>S.</given-names></name> <name><surname>Tofighi</surname> <given-names>G.</given-names></name></person-group> (<year>2016</year>). <article-title>Classification of alzheimer&#x2019;s disease using fmri data and deep learning convolutional neural networks.</article-title> <source><italic>arXiv</italic></source> [<comment>Preprint</comment>].</citation></ref>
<ref id="B51"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Selkoe</surname> <given-names>D. J.</given-names></name></person-group> (<year>2019</year>). <article-title>Early network dysfunction in Alzheimer&#x2019;s disease.</article-title> <source><italic>Science</italic></source> <volume>365</volume> <fpage>540</fpage>&#x2013;<lpage>541</lpage>. <pub-id pub-id-type="doi">10.1126/science.aay5188</pub-id> <pub-id pub-id-type="pmid">31395769</pub-id></citation></ref>
<ref id="B52"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shankle</surname> <given-names>W. R.</given-names></name> <name><surname>Mani</surname> <given-names>S.</given-names></name> <name><surname>Pazzani</surname> <given-names>M. J.</given-names></name> <name><surname>Smyth</surname> <given-names>P.</given-names></name></person-group> (<year>1997</year>). &#x201C;<article-title>Detecting very early stages of dementia from normal aging with machine learning methods</article-title>,&#x201D; in <source><italic>Conference on Artificial Intelligence in Medicine in Europe</italic></source>, (<publisher-loc>Berlin</publisher-loc>: <publisher-name>Springer</publisher-name>), <fpage>71</fpage>&#x2013;<lpage>85</lpage>. <pub-id pub-id-type="doi">10.1007/BFb0029438</pub-id></citation></ref>
<ref id="B53"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sharp</surname> <given-names>E. S.</given-names></name> <name><surname>Gatz</surname> <given-names>M.</given-names></name></person-group> (<year>2011</year>). <article-title>The relationship between education and dementia an updated systematic review.</article-title> <source><italic>Alzheimer Dis. Assoc. Disord.</italic></source> <volume>25</volume>:<fpage>289</fpage>. <pub-id pub-id-type="doi">10.1097/WAD.0b013e318211c83c</pub-id> <pub-id pub-id-type="pmid">21750453</pub-id></citation></ref>
<ref id="B54"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sheehan</surname> <given-names>B.</given-names></name></person-group> (<year>2012</year>). <article-title>Assessment scales in dementia.</article-title> <source><italic>Ther. Adv. Neurol. Disord.</italic></source> <volume>5</volume> <fpage>349</fpage>&#x2013;<lpage>358</lpage>. <pub-id pub-id-type="doi">10.1177/1756285612455733</pub-id> <pub-id pub-id-type="pmid">23139705</pub-id></citation></ref>
<ref id="B55"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shi</surname> <given-names>B.</given-names></name> <name><surname>Chen</surname> <given-names>Y.</given-names></name> <name><surname>Zhang</surname> <given-names>P.</given-names></name> <name><surname>Smith</surname> <given-names>C. D.</given-names></name> <name><surname>Liu</surname> <given-names>J.</given-names></name> <name><surname>Initiative</surname> <given-names>A. S. D. N.</given-names></name></person-group> (<year>2017</year>). <article-title>Nonlinear feature transformation and deep fusion for Alzheimer&#x2019;s Disease staging analysis.</article-title> <source><italic>Pattern Recognize.</italic></source> <volume>63</volume> <fpage>487</fpage>&#x2013;<lpage>498</lpage>. <pub-id pub-id-type="doi">10.1016/j.patcog.2016.09.032</pub-id></citation></ref>
<ref id="B56"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shivamurthy</surname> <given-names>V. K.</given-names></name> <name><surname>Tahari</surname> <given-names>A. K.</given-names></name> <name><surname>Marcus</surname> <given-names>C.</given-names></name> <name><surname>Subramaniam</surname> <given-names>R. M.</given-names></name></person-group> (<year>2015</year>). <article-title>Brain FDG PET and the diagnosis of dementia.</article-title> <source><italic>AJR Am. J. Roentgenol.</italic></source> <volume>204</volume> <fpage>W76</fpage>&#x2013;<lpage>W85</lpage>. <pub-id pub-id-type="doi">10.2214/AJR.13.12363</pub-id> <pub-id pub-id-type="pmid">25539279</pub-id></citation></ref>
<ref id="B57"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Srinivas</surname> <given-names>N.</given-names></name> <name><surname>Krause</surname> <given-names>A.</given-names></name> <name><surname>Kakade</surname> <given-names>S. M.</given-names></name> <name><surname>Seeger</surname> <given-names>M.</given-names></name></person-group> (<year>2009</year>). <article-title>Gaussian process optimization in the bandit setting: No regret and experimental design.</article-title> <source><italic>Proceedings of the 27th International Conference on Machine Learning</italic></source>, <publisher-loc>Pennsylvania</publisher-loc>: <publisher-name>University of Pennsylvania</publisher-name>. 1015-1022</citation></ref>
<ref id="B58"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tibshirani</surname> <given-names>R.</given-names></name></person-group> (<year>1996</year>). <article-title>Regression shrinkage and selection via the lasso.</article-title> <source><italic>J. R Stat. Soc.</italic></source> <volume>58</volume> <fpage>267</fpage>&#x2013;<lpage>288</lpage>. <pub-id pub-id-type="doi">10.1111/j.2517-6161.1996.tb02080.x</pub-id></citation></ref>
<ref id="B59"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Vapnik</surname> <given-names>V.</given-names></name></person-group> (<year>2013</year>). <source><italic>The Nature of Statistical Learning Theory.</italic></source> <publisher-loc>Germany</publisher-loc>: <publisher-name>Springer science &#x0026; business media</publisher-name>.</citation></ref>
<ref id="B60"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Varma</surname> <given-names>S.</given-names></name> <name><surname>Simon</surname> <given-names>R.</given-names></name></person-group> (<year>2006</year>). <article-title>Bias in error estimation when using cross-validation for model selection.</article-title> <source><italic>BMC Bioinformatics</italic></source> <volume>7</volume>:<fpage>91</fpage>. <pub-id pub-id-type="doi">10.1186/1471-2105-7-91</pub-id> <pub-id pub-id-type="pmid">16504092</pub-id></citation></ref>
<ref id="B61"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Warren</surname> <given-names>J. D.</given-names></name> <name><surname>Schott</surname> <given-names>J. M.</given-names></name> <name><surname>Fox</surname> <given-names>N. C.</given-names></name> <name><surname>Thom</surname> <given-names>M.</given-names></name> <name><surname>Revesz</surname> <given-names>T.</given-names></name> <name><surname>Holton</surname> <given-names>J. L.</given-names></name><etal/></person-group> (<year>2005</year>). <article-title>Brain biopsy in dementia.</article-title> <source><italic>Brain</italic></source> <volume>128</volume> <fpage>2016</fpage>&#x2013;<lpage>2025</lpage>. <pub-id pub-id-type="doi">10.1093/brain/awh543</pub-id> <pub-id pub-id-type="pmid">15901648</pub-id></citation></ref>
<ref id="B62"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wen</surname> <given-names>C.</given-names></name> <name><surname>Zhang</surname> <given-names>A.</given-names></name> <name><surname>Quan</surname> <given-names>S.</given-names></name> <name><surname>Wang</surname> <given-names>X.</given-names></name></person-group> (<year>2017</year>). <article-title>Bess: An r package for best subset selection in linear, logistic and CoxPH models.</article-title> <source><italic>J. Stat. Softw.</italic></source> <volume>94</volume> <fpage>1</fpage>&#x2013;<lpage>24</lpage>. <pub-id pub-id-type="doi">10.18637/jss.v094.i04</pub-id></citation></ref>
<ref id="B63"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yu</surname> <given-names>W.</given-names></name> <name><surname>Liu</surname> <given-names>T.</given-names></name> <name><surname>Valdez</surname> <given-names>R.</given-names></name> <name><surname>Gwinn</surname> <given-names>M.</given-names></name> <name><surname>Khoury</surname> <given-names>M. J.</given-names></name></person-group> (<year>2010</year>). <article-title>Application of support vector machine modeling for prediction of common diseases: The case of diabetes and pre-diabetes.</article-title> <source><italic>BMC Med. Inform. Decis. Mak.</italic></source> <volume>10</volume>:<fpage>16</fpage>. <pub-id pub-id-type="doi">10.1186/1472-6947-10-16</pub-id> <pub-id pub-id-type="pmid">20307319</pub-id></citation></ref>
<ref id="B64"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhang</surname> <given-names>C.</given-names></name> <name><surname>Liu</surname> <given-names>C.</given-names></name> <name><surname>Zhang</surname> <given-names>X.</given-names></name> <name><surname>Almpanidis</surname> <given-names>G.</given-names></name></person-group> (<year>2017</year>). <article-title>An up-to-date comparison of state-of-the-art classification algorithms.</article-title> <source><italic>Expert Syst. Appl.</italic></source> <volume>82</volume> <fpage>128</fpage>&#x2013;<lpage>150</lpage>. <pub-id pub-id-type="doi">10.1016/j.eswa.2017.04.003</pub-id></citation></ref>
</ref-list>
</back>
</article>