<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Pharmacol.</journal-id>
<journal-title>Frontiers in Pharmacology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Pharmacol.</abbrev-journal-title>
<issn pub-type="epub">1663-9812</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1216182</article-id>
<article-id pub-id-type="doi">10.3389/fphar.2023.1216182</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Pharmacology</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Development and economic assessment of machine learning models to predict glycosylated hemoglobin in type 2 diabetes</article-title>
<alt-title alt-title-type="left-running-head">Tong et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/fphar.2023.1216182">10.3389/fphar.2023.1216182</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Tong</surname>
<given-names>Yi-Tong</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Gao</surname>
<given-names>Guang-Jie</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Chang</surname>
<given-names>Huan</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Wu</surname>
<given-names>Xing-Wei</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2265554/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Li</surname>
<given-names>Meng-Ting</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1924149/overview"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Chengdu Second People&#x2019;s Hospital</institution>, <addr-line>Chengdu</addr-line>, <addr-line>Sichuan</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Personalized Drug Therapy Key Laboratory of Sichuan Province</institution>, <institution>Department of Pharmacy</institution>, <institution>Sichuan Provincial People&#x2019;s Hospital</institution>, <institution>School of Medicine</institution>, <institution>University of Electronic Science and Technology of China</institution>, <addr-line>Chengdu</addr-line>, <addr-line>Sichuan</addr-line>, <country>China</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Chinese Academy of Sciences Sichuan Translational Medicine Research Hospital</institution>, <addr-line>Chengdu</addr-line>, <addr-line>Sichuan</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/546637/overview">Qiong Zhang</ext-link>, Albert Einstein College of Medicine, United States</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2255458/overview">Tianyi Zhang</ext-link>, Emory University, United States</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2191047/overview">Yuan Gu</ext-link>, Incyte Corporation, United States</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1971355/overview">Shanye Yin</ext-link>, Albert Einstein College of Medicine, United States</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Xing-Wei Wu, <email>wuxingwei@med.uestc.edu.cn</email>; Meng-Ting Li, <email>limengting@uestc.edu.cn</email>
</corresp>
</author-notes>
<pub-date pub-type="epub">
<day>30</day>
<month>06</month>
<year>2023</year>
</pub-date>
<pub-date pub-type="collection">
<year>2023</year>
</pub-date>
<volume>14</volume>
<elocation-id>1216182</elocation-id>
<history>
<date date-type="received">
<day>03</day>
<month>05</month>
<year>2023</year>
</date>
<date date-type="accepted">
<day>19</day>
<month>06</month>
<year>2023</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2023 Tong, Gao, Chang, Wu and Li.</copyright-statement>
<copyright-year>2023</copyright-year>
<copyright-holder>Tong, Gao, Chang, Wu and Li</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>
<bold>Background:</bold> Glycosylated hemoglobin (HbA1c) is recommended for diagnosing and monitoring type 2 diabetes. However, the monitoring frequency in real-world applications has not yet reached the recommended frequency in the guidelines. Developing machine learning models to screen patients with poor glycemic control in patients with T2D could optimize management and decrease medical service costs.</p>
<p>
<bold>Methods:</bold> This study was carried out on patients with T2D who were examined for HbA1c at the Sichuan Provincial People&#x2019;s Hospital from April 2018 to December 2019. Characteristics were extracted from interviews and electronic medical records. The data (excluded FBG or included FBG) were randomly divided into a training dataset and a test dataset with a radio of 8:2 after data pre-processing. Four imputing methods, four screening methods, and six machine learning algorithms were used to optimize data and develop models. Models were compared on the basis of predictive performance metrics, especially on the model benefit (MB, a confusion matrix combined with economic burden associated with therapeutic inertia). The contributions of features were interpreted using SHapley Additive exPlanation (SHAP). Finally, we validated the sample size on the best model.</p>
<p>
<bold>Results:</bold> The study included 980 patients with T2D, of whom 513 (52.3%) were defined as positive (need to perform the HbA1c test). The results indicated that the model trained in the data (included FBG) presented better forecast performance than the models that excluded the FBG value. The best model used modified random forest as the imputation method, ElasticNet as the feature screening method, and the LightGBM algorithms and had the best performance. The MB, AUC, and AUPRC of the best model, among a total of 192 trained models, were 43475.750 (&#xa5;), 0.972, 0.944, and 0.974, respectively. The FBG values, previous HbA1c values, having a rational and reasonable diet, health status scores, type of manufacturers of metformin, interval of measurement, EQ-5D scores, occupational status, and age were the most significant contributors to the prediction model.</p>
<p>
<bold>Conclusion:</bold> We found that MB could be an indicator to evaluate the model prediction performance. The proposed model performed well in identifying patients with T2D who need to undergo the HbA1c test and could help improve individualized T2D management.</p>
</abstract>
<kwd-group>
<kwd>type 2 diabetes</kwd>
<kwd>glycosylated hemoglobin</kwd>
<kwd>prediction models</kwd>
<kwd>machine learning</kwd>
<kwd>model benefit</kwd>
</kwd-group>
<contract-sponsor id="cn001">National Natural Science Foundation of China<named-content content-type="fundref-id">10.13039/501100001809</named-content>
</contract-sponsor>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Experimental Pharmacology and Drug Discovery</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1">
<title>1 Introduction</title>
<p>Diabetes mellitus (DM) is one of the most common and fastest-growing endocrine diseases, with both types (type 1 and type 2) contributing substantially to the healthcare costs of society. According to the International Diabetes Federation (IDF), the number of people with diabetes reached approximately 537 million worldwide by 2021 (1 in 10 adults live with diabetes), and approximately 90%&#x2013;95% of cases of diabetes suffer from type 2 diabetes (T2D) (<xref ref-type="bibr" rid="B36">Sun et al., 2022</xref>). T2D has become a global threat to public health in the 21st century (<xref ref-type="bibr" rid="B41">Wang et al., 2022</xref>). Fasting blood glucose (FBG) and random blood glucose (RBG) have been the traditional method for assessing the risk of T2D, but they have obvious shortcomings&#x2014;change over short periods of time due to behavioral changes (<xref ref-type="bibr" rid="B9">Christine et al., 2017</xref>). Relatively, glycated hemoglobin A1c (HbA1c), representing the average plasma glucose levels for the past 2&#x2013;3&#xa0;months (<xref ref-type="bibr" rid="B32">Rohlfing et al., 2002</xref>), has been recommended for diagnosing and monitoring diabetes by the World Health Organization (WHO) in 2011 and the American Diabetes Association (ADA) in 2010 (<xref ref-type="bibr" rid="B23">Leong et al., 2018</xref>).</p>
<p>According to the latest criteria, the American Diabetes Association (ADA) and the European Association for the Study of Diabetes (EASD) have recommended that glycemic management is evaluated primarily with the HbA1c test, and the therapeutic goal is to reduce the HbA1c to&#x3c;7.0% (<xref ref-type="bibr" rid="B11">Davies et al., 2022</xref>). The Chinese guidelines are in line with international consensus&#x2014;they stress the importance of regular HbA1c measurements (twice a year or four times a year) (<xref ref-type="bibr" rid="B8">Chinese Diabetes Society, 2021</xref>). Studies have shown that glycemic control is required in order to reduce the risk of onset and progression of complications (<xref ref-type="bibr" rid="B43">Williams et al., 2005</xref>; <xref ref-type="bibr" rid="B45">Yu et al., 2022</xref>). Once the target HbA1c is exceeded by 0.5% (&#x3e;5&#xa0;mmol/mol) after 3&#x2013;6&#xa0;months, further intensification should be administered. However, in practice, this does not always happen. The delay in intensifying therapy is referred to in clinical terms as therapeutic inertia and is due to underestimation of the need for therapy or failure to monitor the HbA1c level (<xref ref-type="bibr" rid="B31">Reach et al., 2017</xref>).</p>
<p>Machine learning (ML) is a branch of artificial intelligence and has been widely applied in clinical research and practice to construct high-performing prediction models, such as prediction of disease progression and outcomes (<xref ref-type="bibr" rid="B16">Griffith et al., 2020</xref>; <xref ref-type="bibr" rid="B24">Lewin-Epstein et al., 2020</xref>; <xref ref-type="bibr" rid="B40">Wang et al., 2020</xref>). Especially in the field of T2D management, identifying patients with T2D and estimating the risk of development of complications has become a hot topic during recent years (<xref ref-type="bibr" rid="B1">Ahlqvist et al., 2019</xref>; <xref ref-type="bibr" rid="B13">Dennis et al., 2019</xref>; <xref ref-type="bibr" rid="B18">Heerspink, 2019</xref>). ML has been shown to provide a useful management tool and has played a key role in the recognition of systems as routine therapeutic aids for patients with T2D. Thus, we consider whether it is possible to identify patients with a high risk of poor glycemic control utilizing machine learning methods based on the readily available daily data.</p>
</sec>
<sec sec-type="methods" id="s2">
<title>2 Methods</title>
<sec id="s2-1">
<title>2.1 Data sources</title>
<p>The participants in the study were recruited from outpatients attending the Endocrinology Section of the Sichuan Provincial People&#x2019;s Hospital. Participants were selected according to the following criteria: (1) over 18 years of age; (2) diagnosed as a T2D patient and received hypoglycemic treatment (the diagnostic criteria for T2D were in line with China&#x2019;s 2017 guidelines on preventing and treating type 2 diabetes (<xref ref-type="bibr" rid="B7">Chinese Diabetes Society, 2017</xref>)); and (3) HbA1c levels were measured on the day of collection. (4) Researchers explained the purpose and scope of the survey to the subjects, and those who agreed to take part were retained in the study. Ethics approval was obtained through the Ethics Committee of the Sichuan Provincial People&#x2019;s Hospital (approval &#x23; 2018-53).</p>
<p>Characteristics of participants were obtained from face-to-face interviews and electronic medical records (EMRs). The adherence status was defined according to the proportion of days covered (PDC). PDC higher than 80% was regarded as good medication compliance (<xref ref-type="bibr" rid="B44">Wu et al., 2020</xref>).</p>
</sec>
<sec id="s2-2">
<title>2.2 Outcome definition</title>
<p>HbA1c values on the day of visiting the clinic were measured at the clinical laboratory of Sichuan Provincial People&#x2019;s Hospital and collected from EMRs. In this study, a value of HbA1c more than 7.0% was defined as positive and less than 7.0% was defined as negative. Furthermore, parents who had a positive HbA1c were considered to be needed for detection on the day of attending the Endocrinology Section.</p>
</sec>
<sec id="s2-3">
<title>2.3 Data pre-processing</title>
<p>After data collection ended, the information was converted to an Excel format. Each column represented a candidate variable, and each row represented a sample. To acquire high-quality data for modeling, a series of interventions were performed, including data pre-screening, data imputing, and variable selection.</p>
<p>First, data pre-screening was carried out using the following criteria: (1) the columns with missing values &#x3e; 90% were removed, (2) the columns with a single value occupying &#x3e;90% were removed, and (3) the columns with the coefficients of variation &#x3c;0.1 were removed.</p>
<p>Missing information was inevitable in clinical data, such as the FBG value and PBG value. Missing data were filled using four imputing methods, including simple imputing (marked as SI), random forest imputing (marked as RF), k-nearest neighbor imputing (marked as KNN), and optimal deletion (marked as OD).</p>
<p>In order to eliminate irrelevant variables, reduce the number of variables, and improve the accuracy of the model, variable selection was performed. In this study, four algorithms&#x2014;LASSO (<xref ref-type="bibr" rid="B38">Tibshirani, 1997</xref>), ridge regression (<xref ref-type="bibr" rid="B29">Marquardt and Snee, 1975</xref>), ElasticNet (<xref ref-type="bibr" rid="B34">Simon et al., 2011</xref>), and Boruta (<xref ref-type="bibr" rid="B21">Kursa M B, 2010</xref>)&#x2014;were used to screen the key variables. The four aforementioned algorithms were marked as LA, RD, EN, and BOR, respectively.</p>
</sec>
<sec id="s2-4">
<title>2.4 Data partition</title>
<p>80 % of the data were assigned as the training set and the rest as the test set. The training set was used to train a classification model, and the test set was used to evaluate the model performance. Meanwhile, to assess whether the FGB value on the day was the important variable, the original data with the FGB value were used to train the models.</p>
</sec>
<sec id="s2-5">
<title>2.5 Model building</title>
<p>Sixteen datasets were generated in the training set by four data imputation methods and four variable selection methods. Then, six machine learning algorithms were employed on each dataset, respectively, to develop a total of 112 models. Machine learning algorithms in this study included random forest (RF), logistic regression (LR), multilayer perceptron (MLP), extreme gradient boosting (XGBoost), light gradient boosting machine (LGBM), and categorical boosting (CB).</p>
<p>RF, an ensemble learning algorithm proposed by Breiman, is very commonly used for classification (<xref ref-type="bibr" rid="B5">Breiman, 2001</xref>). Individual decision trees are built using a random subset of the training dataset in the training process. The final classification is then based on the majority voting results of all decision trees (<xref ref-type="bibr" rid="B35">Singha et al., 2019</xref>).</p>
<p>LR is widely used to solve binary classification problems (<xref ref-type="bibr" rid="B20">Jaillard et al., 2020</xref>). It predicts the probability of whether a dependent variable belongs to a particular class. The principle of LR is to first fit the decision boundary and then establish the probability relationship between the boundary and the classification so as to obtain the probability in the case of two classifications (<xref ref-type="bibr" rid="B42">Wang et al., 2020</xref>).</p>
<p>MLP, also known as a feed-forward neural network, is one of the most common deep learning approaches (<xref ref-type="bibr" rid="B39">Wan et al., 2018</xref>). It is mainly used to address supervised learning problems by learning the dependencies between the input layer (the variables) and output layer (the classification decision) using a fully connected hidden layer (<xref ref-type="bibr" rid="B42">Wang et al., 2020</xref>).</p>
<p>XGBoost (<xref ref-type="bibr" rid="B37">Chen and Guestrin, 2016</xref>), LightGBM (<xref ref-type="bibr" rid="B17">Guolin et al., 2017</xref>), and CatBoost (<xref ref-type="bibr" rid="B3">Bent&#xe9;jac et al., 2021</xref>) were the three most popular implementations of gradient-boosting tree-based ensemble methods (<xref ref-type="bibr" rid="B14">Friedman, 2001</xref>). While built on structurally similar ideas, these libraries differ slightly on how decision trees are grown or how categorical variable data are handled, and only experimentation can validate which performs the best.</p>
</sec>
<sec id="s2-6">
<title>2.6 Model evaluation</title>
<p>The test set was used for external validation. A confusion matrix was used to evaluate the accuracy of classifier classification. In this study, a confusion matrix combined with relevant economic indicators, renamed as model benefit (MB), was used to redefine model performance to evaluate the accuracy of classifier classification. The test fee for HbA1c at our hospital was &#xa5;73 per test. The mean additional economic burden of therapeutic inertia (<xref ref-type="bibr" rid="B26">Lindvig et al., 2021</xref>) was regarded as the cost of missed detection. In accordance with the current exchange rate, the exchange rate of the renminbi (RMB, &#xa5;) against the Danish Krone is approximated to 1:1. The cost of missed detection was &#xa5;786.77. The calculation formula was as follows:<disp-formula id="equ1">
<mml:math id="m1">
<mml:mrow>
<mml:mi mathvariant="normal">M</mml:mi>
<mml:mi mathvariant="normal">B</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mo>&#xa5;</mml:mo>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mi mathvariant="normal">T</mml:mi>
<mml:mi mathvariant="normal">o</mml:mi>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:mi mathvariant="normal">l</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi mathvariant="normal">c</mml:mi>
<mml:mi mathvariant="normal">o</mml:mi>
<mml:mi mathvariant="normal">s</mml:mi>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi mathvariant="normal">T</mml:mi>
<mml:mi mathvariant="normal">C</mml:mi>
<mml:mo>,</mml:mo>
<mml:mo>&#xa5;</mml:mo>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mi mathvariant="normal">M</mml:mi>
<mml:mi mathvariant="normal">o</mml:mi>
<mml:mi mathvariant="normal">d</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mi mathvariant="normal">l</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi mathvariant="normal">c</mml:mi>
<mml:mi mathvariant="normal">o</mml:mi>
<mml:mi mathvariant="normal">s</mml:mi>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mi mathvariant="normal">M</mml:mi>
<mml:mi mathvariant="normal">C</mml:mi>
<mml:mo>,</mml:mo>
<mml:mo>&#xa5;</mml:mo>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="equ2">
<mml:math id="m2">
<mml:mrow>
<mml:mi mathvariant="normal">T</mml:mi>
<mml:mi mathvariant="normal">C</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mo>&#xa5;</mml:mo>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mi mathvariant="normal">T</mml:mi>
<mml:mi mathvariant="normal">o</mml:mi>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:mi mathvariant="normal">l</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi mathvariant="normal">p</mml:mi>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:mi mathvariant="normal">r</mml:mi>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
<mml:mi mathvariant="normal">c</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
<mml:mi mathvariant="normal">p</mml:mi>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:mi mathvariant="normal">n</mml:mi>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mi mathvariant="normal">s</mml:mi>
<mml:mo>&#xd7;</mml:mo>
<mml:mi mathvariant="normal">H</mml:mi>
<mml:mi mathvariant="normal">b</mml:mi>
<mml:mi mathvariant="normal">A</mml:mi>
<mml:mn>1</mml:mn>
<mml:mi mathvariant="normal">c</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mi mathvariant="normal">s</mml:mi>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi mathvariant="normal">f</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="equ3">
<mml:math id="m3">
<mml:mrow>
<mml:mi mathvariant="normal">M</mml:mi>
<mml:mi mathvariant="normal">C</mml:mi>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mo>&#xa5;</mml:mo>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mi mathvariant="normal">T</mml:mi>
<mml:mi mathvariant="normal">P</mml:mi>
<mml:mo>&#x2a;</mml:mo>
<mml:mo>&#xd7;</mml:mo>
<mml:mi mathvariant="normal">H</mml:mi>
<mml:mi mathvariant="normal">b</mml:mi>
<mml:mi mathvariant="normal">A</mml:mi>
<mml:mn>1</mml:mn>
<mml:mi mathvariant="normal">c</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mi mathvariant="normal">s</mml:mi>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi mathvariant="normal">f</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mi mathvariant="normal">F</mml:mi>
<mml:mi mathvariant="normal">P</mml:mi>
<mml:mo>&#x2a;</mml:mo>
<mml:mo>&#xd7;</mml:mo>
<mml:mi mathvariant="normal">H</mml:mi>
<mml:mi mathvariant="normal">b</mml:mi>
<mml:mi mathvariant="normal">A</mml:mi>
<mml:mn>1</mml:mn>
<mml:mi mathvariant="normal">c</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mi mathvariant="normal">s</mml:mi>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi mathvariant="normal">f</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mi mathvariant="normal">F</mml:mi>
<mml:mi mathvariant="normal">N</mml:mi>
<mml:mo>&#x2a;</mml:mo>
<mml:mo>&#xd7;</mml:mo>
<mml:mi mathvariant="normal">c</mml:mi>
<mml:mi mathvariant="normal">o</mml:mi>
<mml:mi mathvariant="normal">s</mml:mi>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi mathvariant="normal">o</mml:mi>
<mml:mi mathvariant="normal">f</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi mathvariant="normal">m</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
<mml:mi mathvariant="normal">s</mml:mi>
<mml:mi mathvariant="normal">s</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mi mathvariant="normal">d</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi mathvariant="normal">d</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mi mathvariant="normal">c</mml:mi>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
<mml:mi mathvariant="normal">o</mml:mi>
<mml:mi mathvariant="normal">n</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mi mathvariant="normal">T</mml:mi>
<mml:mi mathvariant="normal">N</mml:mi>
<mml:mo>&#x2a;</mml:mo>
<mml:mo>&#xd7;</mml:mo>
<mml:mi mathvariant="normal">H</mml:mi>
<mml:mi mathvariant="normal">b</mml:mi>
<mml:mi mathvariant="normal">A</mml:mi>
<mml:mn>1</mml:mn>
<mml:mi mathvariant="normal">c</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mi mathvariant="normal">s</mml:mi>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi mathvariant="normal">f</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mo>,</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>
<disp-formula id="equ4">
<mml:math id="m4">
<mml:mrow>
<mml:mrow>
<mml:mfenced open="(" close=")" separators="|">
<mml:mrow>
<mml:mo>&#x2a;</mml:mo>
<mml:mo>:</mml:mo>
<mml:mi mathvariant="normal">T</mml:mi>
<mml:mi mathvariant="normal">P</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mi mathvariant="normal">r</mml:mi>
<mml:mi mathvariant="normal">u</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi mathvariant="normal">p</mml:mi>
<mml:mi mathvariant="normal">o</mml:mi>
<mml:mi mathvariant="normal">s</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
<mml:mi mathvariant="normal">v</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi mathvariant="normal">F</mml:mi>
<mml:mi mathvariant="normal">P</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mi mathvariant="normal">f</mml:mi>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:mi mathvariant="normal">l</mml:mi>
<mml:mi mathvariant="normal">s</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi mathvariant="normal">p</mml:mi>
<mml:mi mathvariant="normal">o</mml:mi>
<mml:mi mathvariant="normal">s</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
<mml:mi mathvariant="normal">v</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi mathvariant="normal">F</mml:mi>
<mml:mi mathvariant="normal">N</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mi mathvariant="normal">f</mml:mi>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:mi mathvariant="normal">l</mml:mi>
<mml:mi mathvariant="normal">s</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi mathvariant="normal">n</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mi mathvariant="normal">g</mml:mi>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
<mml:mi mathvariant="normal">v</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mo>,</mml:mo>
<mml:mi mathvariant="normal">T</mml:mi>
<mml:mi mathvariant="normal">N</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mi mathvariant="normal">r</mml:mi>
<mml:mi mathvariant="normal">u</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi mathvariant="normal">n</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mi mathvariant="normal">g</mml:mi>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
<mml:mi mathvariant="normal">v</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
</mml:mrow>
</mml:mfenced>
</mml:mrow>
<mml:mo>.</mml:mo>
</mml:mrow>
</mml:math>
</disp-formula>In addition, the area under the receiver operating characteristic curve (AUC), area under the precision recall curve (AUPRC), and decision curve analysis (DCA) were summarized to assess the model performance. The contribution of each variable to the predictive model was estimated with SHapley Additive exPlanation (SHAP).</p>
</sec>
<sec id="s2-7">
<title>2.7 Sample size validation</title>
<p>The best model (assessed by MB) was employed to estimate the impact of sample sizes on the predictive performance (<xref ref-type="bibr" rid="B44">Wu et al., 2020</xref>). The total samples were randomly separated into the training set and the test set at a ratio of 8:2. First, 10% of the training set was extracted to train the model, and the AUC was evaluated in the test set. The selected samples from the training set increased from 10% to 100% with a stepwise increase of 10%. These steps were repeated 10 times to generate 10 independent repeated AUC values. The relationship of sample size with the prediction performance of models was assessed according to the inflection point change of the line graph. The steeper broken line indicated that a larger sample size would improve the prediction performance of the model, and the gentler slope indicated that the performance of models was affected a little by the sample size.</p>
<p>Above all, the concise workflow for the development and validation of models is summarized in <xref ref-type="fig" rid="F1">Figure 1</xref>.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Overview of the main modeling steps.</p>
</caption>
<graphic xlink:href="fphar-14-1216182-g001.tif"/>
</fig>
</sec>
<sec id="s2-8">
<title>2.8 Statistical analysis</title>
<p>The continuous variables were described by mean and standard deviation, whereas categorical variables were expressed in terms of frequencies and percentages. Multivariate analyses were performed to identify the factors associated with the model performance. Multivariate analysis was performed by multi-linear regression analysis. Model development was performed using the <italic>sklearn</italic> package and SHAP package in Python (<italic>Python</italic> Software Foundation, Python Language Reference, version 3.6.8) on PyCharm (developed by JetBrains.r.o., version 11.0.4). The grid search technique was applied to calculate hyperparameter values optimally.</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>3 Results</title>
<sec id="s3-1">
<title>3.1 Participant characteristics</title>
<p>Overall, 980 patients completed the survey, among which 571 were male and 409 were female. The mean age was 59.2 &#xb1; 11.9&#xa0;years. A total of 513 patients were defined as positive (52.3%). Participants were grouped according to the HbA1c value, and detailed characteristics of the participants are shown in <xref ref-type="table" rid="T1">Table 1</xref>.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Characteristics of participants when grouped according to HbA1c.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Variable</th>
<th align="left">Identifier</th>
<th align="left">Parameter</th>
<th align="left">Total</th>
<th align="left">HbA1c &#x2264; 7.0</th>
<th align="left">HbA1c &#x3e; 7.0</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">HbA<sub>1c</sub> values</td>
<td align="left"/>
<td align="left"/>
<td align="left">980 (100%)</td>
<td align="left">467 (47.7%)</td>
<td align="left">513 (52.3%)</td>
</tr>
<tr>
<td align="center">Age</td>
<td align="right">X1</td>
<td align="left"/>
<td align="left">59.2 &#xb1; 11.9</td>
<td align="left">58.3 &#xb1; 12.0</td>
<td align="left">59.9 &#xb1; 11.8</td>
</tr>
<tr>
<td align="center">Nationality</td>
<td align="right">X2</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Han</td>
<td align="left">945 (96.5%)</td>
<td align="left">456 (97.6%)</td>
<td align="left">489 (95.3%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Tibetan</td>
<td align="left">31 (3.2%)</td>
<td align="left">9 (1.9%)</td>
<td align="left">22 (4.3%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Qiang</td>
<td align="left">3 (0.3%)</td>
<td align="left">1 (0.2%)</td>
<td align="left">2 (0.4%)</td>
</tr>
<tr>
<td align="center">Gender</td>
<td align="right">X3</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Male</td>
<td align="left">571 (58.3%)</td>
<td align="left">267 (57.2%)</td>
<td align="left">304 (59.2%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Female</td>
<td align="left">409 (41.7%)</td>
<td align="left">200 (42.8%)</td>
<td align="left">209 (40.7%)</td>
</tr>
<tr>
<td align="center">Waistline (cm)</td>
<td align="right">X4</td>
<td align="left"/>
<td align="left">85.3 &#xb1; 9.5</td>
<td align="left">85.0 &#xb1; 9.8</td>
<td align="left">85.5 &#xb1; 9.3</td>
</tr>
<tr>
<td align="center">BMI (kg/m<sup>2</sup>)</td>
<td align="right">X5</td>
<td align="left"/>
<td align="left">24.3 &#xb1; 3.3</td>
<td align="left">24.4 &#xb1; 3.6</td>
<td align="left">24.18 &#xb1; 3.1</td>
</tr>
<tr>
<td align="center">Marital status</td>
<td align="right">X6</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Unmarried</td>
<td align="left">9 (0.9%)</td>
<td align="left">7 (1.5%)</td>
<td align="left">2 (0.4%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Married</td>
<td align="left">940 (96.3%)</td>
<td align="left">447 (95.7%)</td>
<td align="left">493 (96.1%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Divorced</td>
<td align="left">4 (0.4%)</td>
<td align="left">1 (0.2%)</td>
<td align="left">3 (0.6%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Widowed</td>
<td align="left">23 (2.4%)</td>
<td align="left">9 (1.9%)</td>
<td align="left">14 (2.7%)</td>
</tr>
<tr>
<td align="center">Occupational status</td>
<td align="right">X7</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Unemployed</td>
<td align="left">133 (13.6%)</td>
<td align="left">49 (10.5%)</td>
<td align="left">84 (16.4%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Employed</td>
<td align="left">358 (36.6%)</td>
<td align="left">181 (38.8%)</td>
<td align="left">177 (34.5%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Retirement</td>
<td align="left">482 (49.3%)</td>
<td align="left">234 (50.1%)</td>
<td align="left">248 (48.3%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Others</td>
<td align="left">5 (0.5%)</td>
<td align="left">1 (0.2%)</td>
<td align="left">4 (0.8%)</td>
</tr>
<tr>
<td align="center">Education level</td>
<td align="right">X8</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Illiteracy</td>
<td align="left">92 (9.4%)</td>
<td align="left">31 (6.6%)</td>
<td align="left">61 (11.9%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Junior middle school</td>
<td align="left">366 (37.4%)</td>
<td align="left">175 (37.5%)</td>
<td align="left">191 (37.2%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">High school or special secondary school</td>
<td align="left">264 (27.0%)</td>
<td align="left">125 (26.8%)</td>
<td align="left">139 (27.1%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">College and above educational level</td>
<td align="left">256 (26.2%)</td>
<td align="left">136 (29.1%)</td>
<td align="left">120 (23.4%)</td>
</tr>
<tr>
<td align="center">Family history of diabetes mellitus</td>
<td align="right">X9</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">No</td>
<td align="left">629 (64.8%)</td>
<td align="left">304 (65.1%)</td>
<td align="left">325 (63.4%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Yes</td>
<td align="left">341 (35.2%)</td>
<td align="left">157 (33.6%)</td>
<td align="left">184 (35.9%)</td>
</tr>
<tr>
<td align="center">Medicare status</td>
<td align="right">X10</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Non-reimbursement</td>
<td align="left">233 (45.0%)</td>
<td align="left">122 (26.1%)</td>
<td align="left">111 (21.6%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Reimbursement</td>
<td align="left">285 (55.0%)</td>
<td align="left">132 (28.3%)</td>
<td align="left">153 (29.8%)</td>
</tr>
<tr>
<td align="center">Previous HbA<sub>1c</sub> values (%)</td>
<td align="right">X11</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">&#x2264;7%</td>
<td align="left">269 (39.8%)</td>
<td align="left">216 (46.3%)</td>
<td align="left">53 (10.3%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">7%&#x2013;9%</td>
<td align="left">328 (48.5%)</td>
<td align="left">118 (25.3%)</td>
<td align="left">210 (40.9%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">&#x3e;9%</td>
<td align="left">79 (11.7%)</td>
<td align="left">16 (3.4%)</td>
<td align="left">63 (12.3%)</td>
</tr>
<tr>
<td align="center">Interval of measurement (in days)</td>
<td align="right">X12</td>
<td align="left"/>
<td align="left">212.5 &#xb1; 213.7</td>
<td align="left">186.1 &#xb1; 168.9</td>
<td align="left">243.5 &#xb1; 253.4</td>
</tr>
<tr>
<td align="center">Course of diabetes (in months)</td>
<td align="right">X13</td>
<td align="left"/>
<td align="left">90.3 &#xb1; 76.5</td>
<td align="left">71.9 &#xb1; 68.0</td>
<td align="left">107.0 &#xb1; 80.0</td>
</tr>
<tr>
<td align="center">Frequency of FBG measurements</td>
<td align="right">X14</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Irregular measurements</td>
<td align="left">139 (14.2%)</td>
<td align="left">59 (12.6%)</td>
<td align="left">80 (15.6%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Two to three times a week</td>
<td align="left">323 (33.0%)</td>
<td align="left">159 (34.0%)</td>
<td align="left">164 (32.0%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Three to four times a month</td>
<td align="left">400 (40.8%)</td>
<td align="left">197 (42.2%)</td>
<td align="left">203 (39.6%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Two to three times per 3&#xa0;months</td>
<td align="left">118 (12.0%)</td>
<td align="left">52 (11.1%)</td>
<td align="left">66 (12.87)</td>
</tr>
<tr>
<td align="center">Duration of treatment regimen (in months)</td>
<td align="right">X15</td>
<td align="left"/>
<td align="left">24.8 &#xb1; 34.0</td>
<td align="left">21.7 &#xb1; 29.3</td>
<td align="left">27.6 &#xb1; 37.5</td>
</tr>
<tr>
<td align="center">Number of oral drugs</td>
<td align="right">X16</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">0</td>
<td align="left">71 (7.2%)</td>
<td align="left">16 (3.4%)</td>
<td align="left">55 (10.7%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">1</td>
<td align="left">328 (33.5%)</td>
<td align="left">173 (37.0%)</td>
<td align="left">155 (30.2%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">2</td>
<td align="left">419 (42.8%)</td>
<td align="left">190 (40.7%)</td>
<td align="left">229 (44.6%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">3</td>
<td align="left">153 (15.6%)</td>
<td align="left">81 (17.3%)</td>
<td align="left">72 (14.0%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">4</td>
<td align="left">8 (0.8%)</td>
<td align="left">7 (1.5%)</td>
<td align="left">1 (0.2%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">5</td>
<td align="left">1 (0.1%)</td>
<td align="left">0</td>
<td align="left">1 (0.2%)</td>
</tr>
<tr>
<td align="center">Type of insulin used</td>
<td align="right">X17</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">0</td>
<td align="left">731 (74.6%)</td>
<td align="left">383 (82.0%)</td>
<td align="left">348 (67.8%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">1</td>
<td align="left">228 (23.3%)</td>
<td align="left">80 (17.1%)</td>
<td align="left">148 (28.9%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">2</td>
<td align="left">21 (2.1%)</td>
<td align="left">4 (0.9%)</td>
<td align="left">17 (3.3%)</td>
</tr>
<tr>
<td align="center">Use of other types of drugs</td>
<td align="right">X18</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">None</td>
<td align="left">804 (82.1%)</td>
<td align="left">392 (83.9%)</td>
<td align="left">412 (80.3%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">National medicine</td>
<td align="left">11 (1.1%)</td>
<td align="left">1 (0.2%)</td>
<td align="left">10 (2.0%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Chinese medicine</td>
<td align="left">88 (9.0%)</td>
<td align="left">41 (8.8%)</td>
<td align="left">47 (9.2%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Healthcare products</td>
<td align="left">71 (7.3%)</td>
<td align="left">31 (6.6%)</td>
<td align="left">40 (7.8%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Others</td>
<td align="left">5 (0.5%)</td>
<td align="left">2 (0.4%)</td>
<td align="left">3 (0.6%)</td>
</tr>
<tr>
<td align="center">Type of operation or other communicable diseases</td>
<td align="right">X19</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">No</td>
<td align="left">775 (79.2%)</td>
<td align="left">372 (80.0%)</td>
<td align="left">403 (78.6%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Abdominal surgery</td>
<td align="left">114 (11.6%)</td>
<td align="left">48 (10.3%)</td>
<td align="left">66 (12.9%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Thoracic surgery</td>
<td align="left">31 (3.2%)</td>
<td align="left">16 (3.4%)</td>
<td align="left">15 (2.9%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Others</td>
<td align="left">59 (6.0%)</td>
<td align="left">31 (6.6%)</td>
<td align="left">28 (5.5%)</td>
</tr>
<tr>
<td align="center">Number of comorbid diseases</td>
<td align="right">X20</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">0</td>
<td align="left">500 (51.1%)</td>
<td align="left">229 (49.0%)</td>
<td align="left">271 (52.8%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">1</td>
<td align="left">299 (30.5%)</td>
<td align="left">145 (31.0%)</td>
<td align="left">154 (30.0%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">2</td>
<td align="left">143 (14.6%)</td>
<td align="left">73 (15.6%)</td>
<td align="left">70 (13.7%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">3</td>
<td align="left">34 (3.5%)</td>
<td align="left">19 (4.1%)</td>
<td align="left">15 (2.9%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">4</td>
<td align="left">3 (0.3%)</td>
<td align="left">1 (0.2%)</td>
<td align="left">2 (0.4%)</td>
</tr>
<tr>
<td align="center">Hypertension</td>
<td align="right">X21</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">No</td>
<td align="left">663 (67.7%)</td>
<td align="left">311 (66.6%)</td>
<td align="left">352 (68.6%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Yes</td>
<td align="left">317 (32.3%)</td>
<td align="left">156 (33.4%)</td>
<td align="left">161 (31.4%)</td>
</tr>
<tr>
<td align="center">Hyperlipidemia</td>
<td align="right">X22</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">No</td>
<td align="left">768 (78.4%)</td>
<td align="left">364 (77.9%)</td>
<td align="left">404 (78.8%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Yes</td>
<td align="left">211 (21.6%)</td>
<td align="left">103 (22.1%)</td>
<td align="left">108 (21.0%)</td>
</tr>
<tr>
<td align="center">With or without complications</td>
<td align="right">X23</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">No</td>
<td align="left">884 (90.2%)</td>
<td align="left">411 (88.0%)</td>
<td align="left">473 (92.2%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Yes</td>
<td align="left">96 (9.8%)</td>
<td align="left">56 (12.0%)</td>
<td align="left">40 (7.8%)</td>
</tr>
<tr>
<td align="center">Vascular complications</td>
<td align="right">X24</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">No</td>
<td align="left">977 (99.7%)</td>
<td align="left">465 (99.6%)</td>
<td align="left">512 (99.8%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Yes</td>
<td align="left">3 (0.3%)</td>
<td align="left">2 (0.4%)</td>
<td align="left">1 (0.2%)</td>
</tr>
<tr>
<td align="center">Neurological complications</td>
<td align="right">X25</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">No</td>
<td align="left">926 (94.5%)</td>
<td align="left">434 (92.9%)</td>
<td align="left">492 (95.9%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Yes</td>
<td align="left">54 (5.5%)</td>
<td align="left">33 (7.1%)</td>
<td align="left">21 (4.1%)</td>
</tr>
<tr>
<td align="center">Complications with lesions of the extremities</td>
<td align="right">X26</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">No</td>
<td align="left">975 (99.5%)</td>
<td align="left">466 (99.8%)</td>
<td align="left">509 (99.2%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Yes</td>
<td align="left">5 (0.5%)</td>
<td align="left">1 (0.2%)</td>
<td align="left">4 (0.8%)</td>
</tr>
<tr>
<td align="center">Ocular complications</td>
<td align="right">X27</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">No</td>
<td align="left">973 (99.3%)</td>
<td align="left">465 (99.6%)</td>
<td align="left">508 (99.0%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Yes</td>
<td align="left">7 (0.7%)</td>
<td align="left">2 (0.4%)</td>
<td align="left">5 (1.0%)</td>
</tr>
<tr>
<td align="center">Nephropathy complications</td>
<td align="right">X28</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">No</td>
<td align="left">972 (99.2%)</td>
<td align="left">461 (98.7%)</td>
<td align="left">511 (99.6%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Yes</td>
<td align="left">8 (0.8%)</td>
<td align="left">6 (1.3%)</td>
<td align="left">2 (0.4%)</td>
</tr>
<tr>
<td align="center">Complications (other diseases)</td>
<td align="right">X29</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">No</td>
<td align="left">957 (97.7%)</td>
<td align="left">453 (97.0%)</td>
<td align="left">504 (98.3%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Yes</td>
<td align="left">23 (2.3%)</td>
<td align="left">14 (3.0%)</td>
<td align="left">9 (1.7%)</td>
</tr>
<tr>
<td align="center">Intensity of exercise</td>
<td align="right">X30</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">None</td>
<td align="left">153 (15.6%)</td>
<td align="left">51 (10.9%)</td>
<td align="left">102 (19.9%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Low intensity</td>
<td align="left">664 (67.8%)</td>
<td align="left">321 (68.7%)</td>
<td align="left">343 (66.9%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Moderate intensity</td>
<td align="left">124 (12.7%)</td>
<td align="left">76 (16.3%)</td>
<td align="left">48 (9.4%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">High intensity</td>
<td align="left">39 (3.9%)</td>
<td align="left">19 (4.1%)</td>
<td align="left">20 (3.9%)</td>
</tr>
<tr>
<td align="center">Exercise session (mins/day)</td>
<td align="right">X31</td>
<td align="left"/>
<td align="left">53.4 &#xb1; 55.4</td>
<td align="left">53.5 &#xb1; 42.1</td>
<td align="left">53.3 &#xb1; 65.3</td>
</tr>
<tr>
<td align="center">Have a rational and reasonable diet</td>
<td align="right">X32</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">No</td>
<td align="left">256 (26.1%)</td>
<td align="left">70 (15.0%)</td>
<td align="left">186 (36.3%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Yes</td>
<td align="left">724 (73.9%)</td>
<td align="left">397 (85.0%)</td>
<td align="left">327 (63.7%)</td>
</tr>
<tr>
<td align="center">Sleep duration</td>
<td align="right">X33</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Good</td>
<td align="left">453 (46.2%)</td>
<td align="left">223 (47.8%)</td>
<td align="left">230 (44.8%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Ordinary</td>
<td align="left">333 (34.0%)</td>
<td align="left">154 (33.0%)</td>
<td align="left">179 (34.9%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Lose sleep</td>
<td align="left">194 (19.8%)</td>
<td align="left">90 (19.3%)</td>
<td align="left">104 (20.3%)</td>
</tr>
<tr>
<td align="center">Psychological status</td>
<td align="right">X34</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Well</td>
<td align="left">459 (46.8%)</td>
<td align="left">230 (49.3%)</td>
<td align="left">229 (44.6%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">General</td>
<td align="left">493 (50.3%)</td>
<td align="left">225 (48.2%)</td>
<td align="left">268 (52.2%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Depression</td>
<td align="left">28 (2.9%)</td>
<td align="left">12 (2.5%)</td>
<td align="left">16 (3.1%)</td>
</tr>
<tr>
<td align="center">Health status scores (%)</td>
<td align="right">X35</td>
<td align="left"/>
<td align="left">77.3 &#xb1; 10.8</td>
<td align="left">78.3 &#xb1; 11.2</td>
<td align="left">76.4 &#xb1; 10.3</td>
</tr>
<tr>
<td align="center">EQ-5D scores</td>
<td align="right">X36</td>
<td align="left"/>
<td align="left">0.9 &#xb1; 0.1</td>
<td align="left">0.9 &#xb1; 0.1</td>
<td align="left">0.9 &#xb1; 0.1</td>
</tr>
<tr>
<td align="center">Medication adherence</td>
<td align="right">X37</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">No</td>
<td align="left">183 (18.6%)</td>
<td align="left">47 (10.1%)</td>
<td align="left">137 (26.7%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Yes</td>
<td align="left">797 (83.4%)</td>
<td align="left">420 (89.9%)</td>
<td align="left">376 (73.3%)</td>
</tr>
<tr>
<td align="center">Use of metformin</td>
<td align="right">X38</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">None</td>
<td align="left">313 (32.0%)</td>
<td align="left">127 (27.2%)</td>
<td align="left">186 (36.3%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Once a day</td>
<td align="left">175 (17.9%)</td>
<td align="left">97 (20.8%)</td>
<td align="left">78 (15.2%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Twice a day</td>
<td align="left">399 (40.8%)</td>
<td align="left">198 (42.4%)</td>
<td align="left">201 (39.2%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Three times a day</td>
<td align="left">92 (9.3%)</td>
<td align="left">44 (9.4%)</td>
<td align="left">48 (9.4%)</td>
</tr>
<tr>
<td align="center">Dose of metformin</td>
<td align="right">X39</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">None</td>
<td align="left">313 (32.1%)</td>
<td align="left">127 (27.2%)</td>
<td align="left">186 (36.3%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">0.25&#xa0;g</td>
<td align="left">50 (5.1%)</td>
<td align="left">18 (3.9%)</td>
<td align="left">32 (6.2%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">0.425&#xa0;g</td>
<td align="left">2 (0.2%)</td>
<td align="left">2 (0.4%)</td>
<td align="left">0</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">0.5&#xa0;g</td>
<td align="left">154 (15.8%)</td>
<td align="left">60 (12.9%)</td>
<td align="left">94 (18.3%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">0.75&#xa0;g</td>
<td align="left">1 (0.1%)</td>
<td align="left">0</td>
<td align="left">1 (0.2%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">0.85&#xa0;g</td>
<td align="left">447 (45.8%)</td>
<td align="left">256 (54.8%)</td>
<td align="left">191 (37.2%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">1.0&#xa0;g</td>
<td align="left">9 (0.9%)</td>
<td align="left">2 (0.4%)</td>
<td align="left">7 (1.4%)</td>
</tr>
<tr>
<td align="center">Type of manufacturers of metformin</td>
<td align="right">X40</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Unknown</td>
<td align="left">313 (32.1%)</td>
<td align="left">127 (27.2%)</td>
<td align="left">186 (36.3%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Generic drugs</td>
<td align="left">205 (21.0%)</td>
<td align="left">75 (16.1%)</td>
<td align="left">130 (25.3%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Guthentic drugs</td>
<td align="left">458 (46.9%)</td>
<td align="left">264 (56.5%)</td>
<td align="left">194 (37.8%)</td>
</tr>
<tr>
<td align="center">&#x3b1;-Glucosidase inhibitors</td>
<td align="right">X41</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">No</td>
<td align="left">616 (62.9%)</td>
<td align="left">290 (62.1%)</td>
<td align="left">326 (63.5%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Yes</td>
<td align="left">364 (37.1%)</td>
<td align="left">177 (37.9%)</td>
<td align="left">187 (36.5%)</td>
</tr>
<tr>
<td align="center">Sulfonylureas</td>
<td align="right">X42</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">No</td>
<td align="left">637 (65.0%)</td>
<td align="left">316 (67.7%)</td>
<td align="left">321 (62.6%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Yes</td>
<td align="left">343 (35.0%)</td>
<td align="left">151 (32.3%)</td>
<td align="left">192 (37.4%)</td>
</tr>
<tr>
<td align="center">Glinides</td>
<td align="right">X43</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">No</td>
<td align="left">911 (93.0%)</td>
<td align="left">439 (94.0%)</td>
<td align="left">472 (92.0%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Yes</td>
<td align="left">69 (7.0%)</td>
<td align="left">28 (6.0%)</td>
<td align="left">41 (8.0%)</td>
</tr>
<tr>
<td align="center">DPP-4 inhibitors</td>
<td align="right">X44</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">No</td>
<td align="left">845 (86.2%)</td>
<td align="left">379 (81.2%)</td>
<td align="left">466 (90.8%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Yes</td>
<td align="left">135 (13.8%)</td>
<td align="left">88 (18.8%)</td>
<td align="left">47 (9.2%)</td>
</tr>
<tr>
<td align="center">Thiazolidinediones</td>
<td align="right">X45</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">No</td>
<td align="left">928 (94.7%)</td>
<td align="left">438 (93.79%)</td>
<td align="left">490 (95.52%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Yes</td>
<td align="left">52 (5.3%)</td>
<td align="left">29 (6.21%)</td>
<td align="left">23 (4.48%)</td>
</tr>
<tr>
<td align="center">GLP-1 RAs</td>
<td align="right">X46</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">No</td>
<td align="left">979 (99.9%)</td>
<td align="left">466 (99.79%)</td>
<td align="left">513 (100.00%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Yes</td>
<td align="left">1 (0.1%)</td>
<td align="left">1 (0.21%)</td>
<td align="left">0</td>
</tr>
<tr>
<td align="center">SGLT2 inhibitors</td>
<td align="right">X47</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">No</td>
<td align="left">976 (99.6%)</td>
<td align="left">464 (99.36%)</td>
<td align="left">512 (99.81%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Yes</td>
<td align="left">4 (0.4%)</td>
<td align="left">3 (0.64%)</td>
<td align="left">1 (0.19%)</td>
</tr>
<tr>
<td align="center">Use of Chinese medicine</td>
<td align="right">X48</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">No</td>
<td align="left">974 (99.4%)</td>
<td align="left">467 (100.00%)</td>
<td align="left">507 (98.83%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Yes</td>
<td align="left">6 (0.6%)</td>
<td align="left">0</td>
<td align="left">6 (1.17%)</td>
</tr>
<tr>
<td align="center">Use of insulin</td>
<td align="right">X49</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">No</td>
<td align="left">744 (75.9%)</td>
<td align="left">385 (82.44%)</td>
<td align="left">359 (69.98%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">Yes</td>
<td align="left">236 (24.1%)</td>
<td align="left">82 (17.56%)</td>
<td align="left">154 (30.02%)</td>
</tr>
<tr>
<td align="center">Dose of non-basal insulin in the morning (U)</td>
<td align="right">X50</td>
<td align="left"/>
<td align="left">2.2 &#xb1; 5.8</td>
<td align="left">1.35 &#xb1; 4.76</td>
<td align="left">2.95 &#xb1; 6.46</td>
</tr>
<tr>
<td align="center">Dose of non-basal insulin in the noon (U)</td>
<td align="right">X51</td>
<td align="left"/>
<td align="left">0.4 &#xb1; 2.5</td>
<td align="left">0.25 &#xb1; 2.19</td>
<td align="left">0.55 &#xb1; 2.76</td>
</tr>
<tr>
<td align="center">Dose of non-basal insulin in the afternoon (U)</td>
<td align="right">X52</td>
<td align="left"/>
<td align="left">2.2 &#xb1; 5.7</td>
<td align="left">1.36 &#xb1; 4.67</td>
<td align="left">2.93 &#xb1; 6.42</td>
</tr>
<tr>
<td align="center">Dose of basal insulin (U)</td>
<td align="right">X53</td>
<td align="left"/>
<td align="left">2.0 &#xb1; 5.7</td>
<td align="left">1.25 &#xb1; 4.13</td>
<td align="left">2.68 &#xb1; 6.78</td>
</tr>
<tr>
<td align="center">Times of insulin use</td>
<td align="right">X54</td>
<td align="left"/>
<td align="left"/>
<td align="left"/>
<td align="left"/>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">0</td>
<td align="left">730 (74.5%)</td>
<td align="left">381 (81.58%)</td>
<td align="left">349 (68.03%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">1</td>
<td align="left">104 (10.6%)</td>
<td align="left">45 (9.64%)</td>
<td align="left">59 (11.50%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">2</td>
<td align="left">112 (11.4%)</td>
<td align="left">33 (7.07%)</td>
<td align="left">79 (15.40%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">3</td>
<td align="left">15 (1.5%)</td>
<td align="left">5 (1.07%)</td>
<td align="left">10 (1.95%)</td>
</tr>
<tr>
<td align="left"/>
<td align="left"/>
<td align="left">4</td>
<td align="left">19 (2.0%)</td>
<td align="left">3 (0.64%)</td>
<td align="left">16 (3.12%)</td>
</tr>
<tr>
<td align="center">Present FBG values (mmoL/L)</td>
<td align="right">X55</td>
<td align="left">
</td>
<td align="left">9.3 &#xb1; 3.56</td>
<td align="left">7.12 &#xb1; 1.45</td>
<td align="left">10.73 &#xb1; 3.81</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>BMI: body mass index. HbA1c: glycated hemoglobin. FBG: fasting blood glucose. RBG: random blood glucose. EQ-5D: EuroQol five-dimension questionnaire. DPP-4 inhibitors: dipeptidylpeptidase-4 inhibitors. GLP-1 Ras: glucagon-like peptide-1 receptor agonists. SGLT2 inhibitors: sodium-dependent glucose transporters 2 inhibitors.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>After data pre-screening, 15 variables were removed (nationality, marital status, with or without complications, vascular complications, neurological complications, complications with lesions of the extremities, ocular complications, nephropathy complications, complications (other diseases), glinides, thiazolidinediones, GLP-1 Ras, SGLT2 inhibitors, SGLT2 inhibitors, and the use of Chinese medicine).</p>
</sec>
<sec id="s3-2">
<title>3.2 Dataset building</title>
<p>A total of 60 datasets were set up by applying different imputing methods and variable selection methods with 41 variables. The different numbers of variables and samples in each dataset are listed in <xref ref-type="table" rid="T2">Table 2</xref>.</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Detailed information of 16 datasets.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Number</th>
<th align="center">Imputing methods</th>
<th align="center">Screening methods</th>
<th align="center">Number of variables</th>
<th align="center">Number of train samples</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="center">1</td>
<td align="center">KNN</td>
<td align="center">BOR</td>
<td align="center">14</td>
<td align="center">784</td>
</tr>
<tr>
<td align="center">2</td>
<td align="center">KNN</td>
<td align="center">EN</td>
<td align="center">33</td>
<td align="center">784</td>
</tr>
<tr>
<td align="center">3</td>
<td align="center">KNN</td>
<td align="center">LA</td>
<td align="center">33</td>
<td align="center">784</td>
</tr>
<tr>
<td align="center">4</td>
<td align="center">KNN</td>
<td align="center">RD</td>
<td align="center">16</td>
<td align="center">784</td>
</tr>
<tr>
<td align="center">5</td>
<td align="center">OD</td>
<td align="center">BOR</td>
<td align="center">12</td>
<td align="center">767</td>
</tr>
<tr>
<td align="center">6</td>
<td align="center">OD</td>
<td align="center">EN</td>
<td align="center">29</td>
<td align="center">767</td>
</tr>
<tr>
<td align="center">7</td>
<td align="center">OD</td>
<td align="center">LA</td>
<td align="center">29</td>
<td align="center">767</td>
</tr>
<tr>
<td align="center">8</td>
<td align="center">OD</td>
<td align="center">RD</td>
<td align="center">18</td>
<td align="center">767</td>
</tr>
<tr>
<td align="center">9</td>
<td align="center">RF</td>
<td align="center">BOR</td>
<td align="center">13</td>
<td align="center">784</td>
</tr>
<tr>
<td align="center">10</td>
<td align="center">RF</td>
<td align="center">EN</td>
<td align="center">33</td>
<td align="center">784</td>
</tr>
<tr>
<td align="center">11</td>
<td align="center">RF</td>
<td align="center">LA</td>
<td align="center">33</td>
<td align="center">784</td>
</tr>
<tr>
<td align="center">12</td>
<td align="center">RF</td>
<td align="center">RD</td>
<td align="center">17</td>
<td align="center">784</td>
</tr>
<tr>
<td align="center">13</td>
<td align="center">SI</td>
<td align="center">BOR</td>
<td align="center">14</td>
<td align="center">784</td>
</tr>
<tr>
<td align="center">14</td>
<td align="center">SI</td>
<td align="center">EN</td>
<td align="center">33</td>
<td align="center">784</td>
</tr>
<tr>
<td align="center">15</td>
<td align="center">SI</td>
<td align="center">LA</td>
<td align="center">33</td>
<td align="center">784</td>
</tr>
<tr>
<td align="center">16</td>
<td align="center">SI</td>
<td align="center">RD</td>
<td align="center">16</td>
<td align="center">784</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3-3">
<title>3.3 Model validation</title>
<p>A total of 192 models (whether they included FBG or not) were validated in the test set, considered as external validation, and the performance metrics were output. As shown in <xref ref-type="table" rid="T3">Table 3</xref>; <xref ref-type="fig" rid="F2">Figure 2</xref>, the five best models (excluded FBG) were listed in sequence according to the MB value. The five best models were trained in the No. 12 dataset (applied modified random forest as the imputing method and Ridge as the selection method). The MB, AUC, accuracy, and AUPRC values of the best model (model 1) were 3163.800 (&#xa5;), 0.852, 0.811, and 0.845, respectively.</p>
<table-wrap id="T3" position="float">
<label>TABLE 3</label>
<caption>
<p>Summary of the performance of the five best models (excluded the FBG value).</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">ID</th>
<th align="center">Algorithms</th>
<th align="center">No. of datasets</th>
<th align="center">Parameters</th>
<th align="center">MC(&#xa5;)</th>
<th align="center">AUC</th>
<th align="center">Accuracy</th>
<th align="center">AUPRC</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td rowspan="2" align="center">Model 1</td>
<td rowspan="2" align="center">LGBM</td>
<td rowspan="2" align="center">12</td>
<td align="center">Max depth &#x3d; 1</td>
<td rowspan="2" align="center">3163.800</td>
<td rowspan="2" align="center">0.852</td>
<td rowspan="2" align="center">0.811</td>
<td rowspan="2" align="center">0.845</td>
</tr>
<tr>
<td align="center">Subsample &#x3d; 0.1</td>
</tr>
<tr>
<td align="center">Model 2</td>
<td align="center">CB</td>
<td align="center">12</td>
<td align="center">N estimators &#x3d; 96</td>
<td align="center">&#x2212;13950.450</td>
<td align="center">0.850</td>
<td align="center">0.791</td>
<td align="center">0.840</td>
</tr>
<tr>
<td align="center">Model 3</td>
<td align="center">RF</td>
<td align="center">12</td>
<td align="center">N estimators &#x3d; 197</td>
<td align="center">&#x2212;14031.600</td>
<td align="center">0.840</td>
<td align="center">0.770</td>
<td align="center">0.839</td>
</tr>
<tr>
<td align="center">Model 4</td>
<td align="center">MLP</td>
<td align="center">12</td>
<td align="center">Activation &#x3d; tanh; hidden layer sizes&#x3d; (100, 50, 1); solver &#x3d; sgd</td>
<td align="center">&#x2212;16221.600</td>
<td align="center">0.816</td>
<td align="center">0.755</td>
<td align="center">0.824</td>
</tr>
<tr>
<td align="center">Model 5</td>
<td align="center">XGB</td>
<td align="center">12</td>
<td align="center">Gamma &#x3d; 0.1; max depth &#x3d; 3; subsample &#x3d; 0.7</td>
<td align="center">&#x2212;18249.300</td>
<td align="center">0.848</td>
<td align="center">0.781</td>
<td align="center">0.861</td>
</tr>
</tbody>
</table>
</table-wrap>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Performance of the five best models (excluded FBG). <bold>(A)</bold> ROC curves. <bold>(B)</bold> Precision&#x2013;recall curves. <bold>(C)</bold> Calibration plots. <bold>(D)</bold> DCA plots.</p>
</caption>
<graphic xlink:href="fphar-14-1216182-g002.tif"/>
</fig>
<p>As listed in <xref ref-type="table" rid="T4">Table 4</xref>; <xref ref-type="fig" rid="F3">Figure 3</xref>, the five best models (included FBG) were trained in No. 11 and No. 10 datasets (applied modified random forest as the imputing method and ElasticNet or LASSO as the selection method). The MB, AUC, accuracy, and AUPRC values of the best model (model 1) were 43475.750 (&#xa5;), 0.972, 0.944, and 0.974, respectively. The calibration and DCA curves also displayed excellent predictive performances (<xref ref-type="fig" rid="F2">Figures 2C, D</xref>; <xref ref-type="fig" rid="F3">Figures 3C, D</xref>). The model that included FBG produced superior forecast performance compared to the model that excluded the FBG value.</p>
<table-wrap id="T4" position="float">
<label>TABLE 4</label>
<caption>
<p>Summary of the performance of the five best models (included the FBG value).</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">ID</th>
<th align="center">Algorithms</th>
<th align="center">No. of datasets</th>
<th align="center">Parameters</th>
<th align="center">MC(&#xa5;)</th>
<th align="center">AUC</th>
<th align="center">Accuracy</th>
<th align="center">AUPRC</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td rowspan="2" align="center">Model 1</td>
<td rowspan="2" align="center">LGBM</td>
<td rowspan="2" align="center">10</td>
<td align="center">Max depth &#x3d; 5</td>
<td rowspan="2" align="center">43475.750</td>
<td rowspan="2" align="center">0.972</td>
<td rowspan="2" align="center">0.944</td>
<td rowspan="2" align="center">0.974</td>
</tr>
<tr>
<td align="center">Subsample &#x3d; 0.1</td>
</tr>
<tr>
<td align="center">Model 2</td>
<td align="center">CB</td>
<td align="center">10</td>
<td align="center">N estimators &#x3d; 67</td>
<td align="center">43475.750</td>
<td align="center">0.971</td>
<td align="center">0.944</td>
<td align="center">0.978</td>
</tr>
<tr>
<td rowspan="2" align="center">Model 3</td>
<td rowspan="2" align="center">LGBM</td>
<td rowspan="2" align="center">11</td>
<td align="center">Max depth &#x3d; 5</td>
<td rowspan="2" align="center">43475.750</td>
<td rowspan="2" align="center">0.972</td>
<td rowspan="2" align="center">0.944</td>
<td rowspan="2" align="center">0.974</td>
</tr>
<tr>
<td align="center">Subsample &#x3d; 0.1</td>
</tr>
<tr>
<td align="center">Model 4</td>
<td align="center">CB</td>
<td align="center">11</td>
<td align="center">N estimators &#x3d; 67</td>
<td align="center">43475.750</td>
<td align="center">0.971</td>
<td align="center">0.944</td>
<td align="center">0.978</td>
</tr>
<tr>
<td align="center">Model 5</td>
<td align="center">RF</td>
<td align="center">10</td>
<td align="center">N estimators &#x3d; 147</td>
<td align="center">42745.750</td>
<td align="center">0.974</td>
<td align="center">0.939</td>
<td align="center">0.980</td>
</tr>
</tbody>
</table>
</table-wrap>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Performance of the five best models (included FBG). <bold>(A)</bold> ROC curves. <bold>(B)</bold> Precision&#x2013;recall curves. <bold>(C)</bold> Calibration plots. <bold>(D)</bold> DCA plots.</p>
</caption>
<graphic xlink:href="fphar-14-1216182-g003.tif"/>
</fig>
</sec>
<sec id="s3-4">
<title>3.4 SHapley Additive exPlanation evaluation</title>
<p>SHAP was used to interpret the results from the best model. The result of SHAP in the best model (excluded FBG) is shown in <xref ref-type="fig" rid="F4">Figure 4</xref>. As shown in <xref ref-type="fig" rid="F4">Figure 4A</xref>, SHAP evaluation quantifies the contribution of a feature in a single sample. As results in <xref ref-type="fig" rid="F4">Figure 4B</xref>, previous HbA1c values, having a rational and reasonable diet, course of diabetes, BMI, interval of measurement, duration of treatment regimen, type of manufacturers of metformin, age, waistline, and marital status were the 10 most important variables.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Results of SHAP in the best model (excluded FBG). <bold>(A)</bold> SHAP value contribution graph of each indicator of a single sample. <bold>(B)</bold> Complete distribution of the SHAP values for the top 10 variables.</p>
</caption>
<graphic xlink:href="fphar-14-1216182-g004.tif"/>
</fig>
<p>The results of the contribution of variables in the best model (included FBG) are shown in <xref ref-type="fig" rid="F5">Figure 5</xref>. As illustrated in <xref ref-type="fig" rid="F5">Figure 5A</xref>, waistline, previous HbA1c values, interval of measurement, number of oral drugs, psychological status, EQ-5D scores, type of manufacturers of metformin, and FBG values provided a positive contribution to the SHAP value, while exercise session and course of diabetes provided a negative contribution. As presented in <xref ref-type="fig" rid="F5">Figure 5B</xref>, the 10 most important variables were FBG values, previous HbA1c values, having a rational and reasonable diet, health status scores, type of manufacturers of metformin, interval of measurement, EQ-5D scores, occupational status, and age.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>Results of SHAP in the best model (included FBG). <bold>(A)</bold> SHAP value contribution graph of each indicator of a single sample. <bold>(B)</bold> Complete distribution of the SHAP values for the top 10 variables.</p>
</caption>
<graphic xlink:href="fphar-14-1216182-g005.tif"/>
</fig>
</sec>
<sec id="s3-5">
<title>3.5 Sample size assessment</title>
<p>The adequacy of the sample size was verified using the resampling bootstrapping method, and the results are plotted in <xref ref-type="fig" rid="F6">Figure 6</xref>. The AUC gradually increased and the dispersion of the AUC value decreased as the percentage of the sample size increased. When the sample size reached 60%, the curve flattened. The results indicated that the performance of the model might be slightly affected when expanding the sample size.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>Results of sample size validation.</p>
</caption>
<graphic xlink:href="fphar-14-1216182-g006.tif"/>
</fig>
</sec>
<sec id="s3-6">
<title>3.6 Multivariate analysis</title>
<p>As shown in <xref ref-type="table" rid="T5">Table 5</xref>, the number of samples could significantly affect the model prediction performance, including MB, AUC, accuracy, precision, and recall (<italic>p</italic> &#x3c; 0.01). We found that the number of variables could affect the MB and recall of the prediction model significantly (<italic>p</italic> &#x3c; 0.01). MB and AUC were influenced by screening methods (<italic>p</italic> &#x3c; 0.05). Precision was affected by imputing methods (<italic>p</italic> &#x3c; 0.01).</p>
<table-wrap id="T5" position="float">
<label>TABLE 5</label>
<caption>
<p>Results of multivariate analysis.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="center">Factors</th>
<th align="center">MB(&#xa5;)</th>
<th align="center">AUC</th>
<th align="center">Accuracy</th>
<th align="center">Precision</th>
<th align="center">Recall</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td rowspan="2" align="center">Number of samples</td>
<td align="center">3149.651</td>
<td align="center">&#x2212;0.119</td>
<td align="center">&#x2212;0.02</td>
<td align="center">&#x2212;0.098</td>
<td align="center">&#x2212;0.015</td>
</tr>
<tr>
<td align="center">
<italic>p</italic> &#x3c; 0.001</td>
<td align="center">
<italic>p</italic> &#x3d; 0.002</td>
<td align="center">
<italic>p</italic> &#x3c; 0.001</td>
<td align="center">
<italic>p</italic> &#x3c; 0.001</td>
<td align="center">
<italic>p</italic> &#x3c; 0.001</td>
</tr>
<tr>
<td rowspan="2" align="center">Number of variables</td>
<td align="center">&#x2212;58.292</td>
<td align="center">&#x2212;0.001</td>
<td align="center">-</td>
<td align="center">-</td>
<td align="center">&#x2212;0.001</td>
</tr>
<tr>
<td align="center">
<italic>p</italic> &#x3d; 0.001</td>
<td align="center">
<italic>p</italic> &#x3d; 0.817</td>
<td align="center">-</td>
<td align="center">-</td>
<td align="center">
<italic>p</italic> &#x3d; 0.005</td>
</tr>
<tr>
<td rowspan="2" align="center">Imputing methods</td>
<td align="center">&#x2212;167.705</td>
<td align="center">0.008</td>
<td align="center">-</td>
<td align="center">0.057</td>
<td align="center">0.002</td>
</tr>
<tr>
<td align="center">
<italic>p</italic> &#x3d; 0.17</td>
<td align="center">
<italic>p</italic> &#x3d; 0.610</td>
<td align="center">-</td>
<td align="center">
<italic>p</italic> &#x3c; 0.001</td>
<td align="center">
<italic>p</italic> &#x3d; 0.196</td>
</tr>
<tr>
<td rowspan="2" align="center">Screening methods</td>
<td align="center">&#x2212;36.986</td>
<td align="center">0.006</td>
<td align="left"/>
<td align="center">0.002</td>
<td align="center">-</td>
</tr>
<tr>
<td align="center">
<italic>p</italic> &#x3d; 0.044</td>
<td align="center">
<italic>p</italic> &#x3d; 0.011</td>
<td align="center">-</td>
<td align="center">
<italic>p</italic> &#x3d; 0.215</td>
<td align="center">-</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<title>4 Discussion</title>
<p>In this research, we developed a total of 192 models (whether they included FBG or not) for the prediction of patients with poor glycemic control in patients with T2D. The MB, AUC, and AUPRC values of the best model were 43475.750 (&#xa5;), 0.972, 0.944, and 0.974, respectively. FBG values, previous HbA1c values, having a rational and reasonable diet, health status scores, type of manufacturers of metformin, interval of measurement, EQ-5D scores, occupational status, and age were the most important contributors to the prediction model.</p>
<p>In recent years, with the continuous development of artificial intelligence techniques, machine learning algorithms have been applied increasingly in clinical prediction models, and disease prediction models have begun to become a hot spot in clinical research. According to the TRIPOD checklist (<xref ref-type="bibr" rid="B10">Collins et al., 2015</xref>), the performance measures (with CI) for the prediction model should be reported. The AUC on validation data has represented the prediction abilities of models in most studies (<xref ref-type="bibr" rid="B6">Chan et al., 2021</xref>; <xref ref-type="bibr" rid="B15">Gibbons et al., 2021</xref>; <xref ref-type="bibr" rid="B12">de Souza et al., 2022</xref>; <xref ref-type="bibr" rid="B45">Yu et al., 2022</xref>). In addition, some prediction models have been internally validated by Harrell&#x2019;s concordance index, the Brier score, and a satisfactory calibration curve (<xref ref-type="bibr" rid="B30">Qu et al., 2021</xref>; <xref ref-type="bibr" rid="B27">Lo-Ciganic et al., 2022</xref>). These aforementioned performance metrics pay more attention to the accuracy of the model and result in less clinical cost caused by wrong prediction or negative predictive value. In this study, we explored a novel measure that could overcome the limitation. Referring to the principles of pharmacoeconomic analysis, parameters for a cost&#x2013;benefit analysis are costs for drugs and benefits for treatments. The worst outcomes of the absence of the HbA1c test were considered to lead to treatment inertia in this study. The economic burden associated with therapeutic inertia was regarded as the cost of negative predictive value, and these data were obtained from the study in patients with type 2 diabetes in Denmark (<xref ref-type="bibr" rid="B26">Lindvig et al., 2021</xref>). The fee for the HbA1c test was considered as the cost of treatment. Therefore, the MB of the best model in the study was 43475.750 (&#xa5;), suggesting that significant gains may result from the prediction model.</p>
<p>The primary goals in the treatment of patients with T2D are to maintain blood glucose levels as close to normal as possible and to achieve a relatively normal quality of life. Scientists early realized that both of these goals are influenced by a multitude of somatic and psychological factors (<xref ref-type="bibr" rid="B33">Rose et al., 2002</xref>; <xref ref-type="bibr" rid="B43">Williams et al., 2005</xref>). In addition, studies reported that educational level, age, duration of diabetes, BMI, and HbA1c at baseline were associated with HbA1c (<xref ref-type="bibr" rid="B19">Hu et al., 2020</xref>). One research reminded that occupational categories were relational to T2D (<xref ref-type="bibr" rid="B2">Baek et al., 2019</xref>). According to the results of SHAP in our study, the 10 most important variables were FBG values, previous HbA1c values, having a rational and reasonable diet, health status scores, type of manufacturers of metformin, interval of measurement, EQ-5D scores, occupational status, and age. The relationship between HbA1c and average glucose levels has been explored in many studies (<xref ref-type="bibr" rid="B22">Law et al., 2017</xref>). Meanwhile, this study developed prediction models on the different data (excluded FGB vs. included FGB). The results suggested that incorporating FGB into the models can allow for further improvements in predictive performance (3163.800 (&#xa5;) vs. 43475.750 (&#xa5;)).</p>
<p>In this study, multiple methods and algorithms were applied to build models. Because of their different principles, the methods and algorithms have different strengths and weaknesses. Specifically, four imputing methods were used to fill in missing values. The SI method fills with fixed values (<xref ref-type="bibr" rid="B28">L&#xf6;w et al., 2019</xref>): the missing value of a continuous variable is replaced by the mean of the variable, and the missing value of a categorical variable is filled with the median. KNN (<xref ref-type="bibr" rid="B4">Beretta and Santaniello, 2016</xref>) and RF (<xref ref-type="bibr" rid="B25">Liao et al., 2022</xref>) are ensemble prediction methods and put out the predictive value to fill in the missing value of variables based on the variables without missing value. Compared to the fixed value, the predicted value should theoretically be similar to the true value. Meanwhile, this will also artificially increase the connection between variables. OD is a normal method to exclude variables with missing values, which we recently proposed. The principle of the algorithm was to keep the maximum sample size with no missing value by deleting variables (columns of the table) or samples (rows of the table). According to the results of the multivariate analysis (shown in <xref ref-type="table" rid="T5">Table 5</xref>), methods and algorithms could significantly affect the prediction performance. So, it is necessary to try which method is the most suitable for data preprocessing or modeling. On the same lines, XGBoost, LGBM, and CatBoost were implementations of gradient-boosting tree-based ensemble methods. The MB of LGBM was higher than that of others both in data that excluded the FGB value or data that included the FGB value (<xref ref-type="table" rid="T3">Table 3</xref>; <xref ref-type="table" rid="T4">Table 4</xref>), which was similar to a previous research (<xref ref-type="bibr" rid="B46">Zhang et al., 2022</xref>).</p>
</sec>
<sec id="s5">
<title>5 Limitation</title>
<p>First, the data were collected prospectively, but our study has the inherent limitations of a single-center retrospective analysis. Although the sample size in our study has been demonstrated to be suitable for modeling, more samples need to be collected in order to verify this prediction model, or a large multicenter sample study is desired that can substantiate the applicability of the model. Second, due to the retrospective research, for some variables, recall bias still exists, such as the intensity of exercise and exercise sessions.</p>
</sec>
<sec sec-type="conclusion" id="s6">
<title>6 Conclusion</title>
<p>In summary, the present research introduced 192 machine learning models to predict poor glycemic control in patients with T2D and proposed a new indicator to evaluate the performance of the prediction model. In fact, we developed a prediction model with better classifier performance. This work also reconfirmed that variables such as FBG values, previous HbA1c values, having a rational and reasonable diet, health status scores, interval of measurement, EQ-5D scores, occupational status, and age were risk factors for glycemic control. We are in the process of developing a mobile app or a Web server for caregivers and patients in an effort to integrate the glycemic control enhancement intervention into daily T2D management.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s7">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/Supplementary Material; further inquiries can be directed to the corresponding authors.</p>
</sec>
<sec id="s8">
<title>Ethics statement</title>
<p>The studies involving human participants were reviewed and approved by the Ethics Committee of the Sichuan Provincial People&#x2019;s Hospital (approval &#x23; 2018-53). The ethics committee waived the requirement of written informed consent for participation.</p>
</sec>
<sec id="s9">
<title>Author contributions</title>
<p>Y-TT contributed to data collection, data analysis, writing, and approval of the final manuscript. G-JG and HC assisted in data analysis and model design. X-WW and M-TL were responsible for designing and coordinating the research. All authors contributed to the article and approved the submitted version.</p>
</sec>
<sec id="s10">
<title>Funding</title>
<p>This study was funded by the National Natural Science Foundation of China (grant nos. 72004020 and 72174038), the National Key R&#x26;D Research Program of China, the National Key Research Program (grant no. 2020YFC2005506), and the Scientific Research Foundation of Sichuan Provincial People&#x2019;s Hospital (grant no. 2022BH10).</p>
</sec>
<sec sec-type="COI-statement" id="s11">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s12">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors, and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ahlqvist</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Tuomi</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Groop</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Clusters provide a better holistic view of type 2 diabetes than simple clinical features</article-title>. <source>Lancet Diabetes Endocrinol.</source> <volume>7</volume>, <fpage>668</fpage>&#x2013;<lpage>669</lpage>. <pub-id pub-id-type="doi">10.1016/S2213-8587(19)30257-8</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Baek</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>G. R.</given-names>
</name>
<name>
<surname>Park</surname>
<given-names>E. C.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Cross-sectional study of the association between long working hours and pre-diabetes: 2010-2017 korea national health and nutrition examination survey</article-title>. <source>BMJ Open</source> <volume>9</volume>, <fpage>033579</fpage>. <pub-id pub-id-type="doi">10.1136/bmjopen-2019-033579</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bent&#xe9;JAC</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Cs&#xf6;RG&#x150;</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Mart&#xed;NEZ-Mu&#xf1;OZ</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>A comparative analysis of gradient boosting algorithms</article-title>. <source>Artif. Intell. Rev.</source> <volume>54</volume>, <fpage>1937</fpage>&#x2013;<lpage>1967</lpage>. <pub-id pub-id-type="doi">10.1007/s10462-020-09896-5</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Beretta</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Santaniello</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Nearest neighbor imputation algorithms: A critical evaluation</article-title>. <source>BMC Med. Inf. Decis. Mak.</source> <volume>16</volume> (<issue>3</issue>), <fpage>74</fpage>. <pub-id pub-id-type="doi">10.1186/s12911-016-0318-z</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Breiman</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2001</year>). <article-title>Random forests</article-title>. <source>Mach. Learn.</source> <volume>45</volume>, <fpage>5</fpage>&#x2013;<lpage>32</lpage>. <pub-id pub-id-type="doi">10.1023/a:1010933404324</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chan</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Nadkarni</surname>
<given-names>G. N.</given-names>
</name>
<name>
<surname>Fleming</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>McCullough</surname>
<given-names>J. R.</given-names>
</name>
<name>
<surname>Connolly</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Mosoyan</surname>
<given-names>G.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Derivation and validation of a machine learning risk score using biomarker and electronic patient data to predict progression of diabetic kidney disease</article-title>. <source>Diabetologia</source> <volume>64</volume>, <fpage>1504</fpage>&#x2013;<lpage>1515</lpage>. <pub-id pub-id-type="doi">10.1007/s00125-021-05444-0</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<collab>Chinese Diabetes Society</collab> (<year>2017</year>). <article-title>Guideline for the prevention and control of type 2 diabetes in China(2017 edition)</article-title>. <source>Chin. J. Pract. Intern. Med.</source> <volume>38</volume>, <fpage>292</fpage>&#x2013;<lpage>344</lpage>. <pub-id pub-id-type="doi">10.19538/j.nk2018040108</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<collab>Chinese Diabetes Society</collab> (<year>2021</year>). <article-title>Guideline for the prevention and treatment of type 2 diabetes mellitus in China(2020 edition)</article-title>. <source>Chin. J. Pract. Intern. Med.</source> <volume>41</volume>, <fpage>668</fpage>&#x2013;<lpage>695</lpage>. <pub-id pub-id-type="doi">10.19538/j.nk2021080106</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Christine</surname>
<given-names>P. J.</given-names>
</name>
<name>
<surname>Moore</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Crawford</surname>
<given-names>N. D.</given-names>
</name>
<name>
<surname>Barrientos-Gutierrez</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>S&#xe1;nchez</surname>
<given-names>B. N.</given-names>
</name>
<name>
<surname>Seeman</surname>
<given-names>T.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Exposure to neighborhood foreclosures and changes in cardiometabolic health: Results from MESA</article-title>. <source>Am. J. Epidemiol.</source> <volume>185</volume>, <fpage>106</fpage>&#x2013;<lpage>114</lpage>. <pub-id pub-id-type="doi">10.1093/aje/kww186</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Chen</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Guestrin</surname>
<given-names>C.</given-names>
</name>
</person-group> (<year>2016</year>). &#x201c;<article-title>XGBoost: A scalable tree boosting system [M]</article-title>,&#x201d; in <conf-name>Proceedings of the 22nd ACM SIGKDD international conference on knowledge Discovery and data mining - KDD &#x2019;16</conf-name>, <conf-loc>San Francisco, CA</conf-loc>, <conf-date>August 13&#x2013;17, 2016</conf-date>. (<publisher-name>ACM</publisher-name>).</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Collins</surname>
<given-names>G. S.</given-names>
</name>
<name>
<surname>Reitsma</surname>
<given-names>J. B.</given-names>
</name>
<name>
<surname>Altman</surname>
<given-names>D. G.</given-names>
</name>
<name>
<surname>Moons</surname>
<given-names>K. G. M.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Transparent reporting of a multivariable prediction model for individual prognosis or diagnosis (TRIPOD): The TRIPOD statement</article-title>. <source>Br. J. Surg.</source> <volume>102</volume>, <fpage>148</fpage>&#x2013;<lpage>158</lpage>. <pub-id pub-id-type="doi">10.1002/bjs.9736</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Davies</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Aroda</surname>
<given-names>V. R.</given-names>
</name>
<name>
<surname>Collins</surname>
<given-names>B. S.</given-names>
</name>
<name>
<surname>Gabbay</surname>
<given-names>R. A.</given-names>
</name>
<name>
<surname>Green</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Maruthur</surname>
<given-names>N. M.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Management of hyperglycemia in type 2 diabetes, 2022. A consensus report by the American diabetes association (ADA) and the European association for the study of diabetes (EASD)</article-title>. <source>Diabetes Care</source> <volume>45</volume>, <fpage>2753</fpage>&#x2013;<lpage>2786</lpage>. <pub-id pub-id-type="doi">10.2337/dci22-0034</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>De Souza</surname>
<given-names>E. S. C. G.</given-names>
</name>
<name>
<surname>Buginga</surname>
<given-names>G. C.</given-names>
</name>
<name>
<surname>De Souza</surname>
<given-names>E. S. E. A.</given-names>
</name>
<name>
<surname>Arena</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Rouleau</surname>
<given-names>C. R.</given-names>
</name>
<name>
<surname>Aggarwal</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Prediction of mortality in coronary artery disease: Role of machine learning and maximal exercise capacity</article-title>. <source>Mayo Clin. Proc.</source> <volume>97</volume>, <fpage>1472</fpage>&#x2013;<lpage>1482</lpage>. <pub-id pub-id-type="doi">10.1016/j.mayocp.2022.01.016</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dennis</surname>
<given-names>J. M.</given-names>
</name>
<name>
<surname>Shields</surname>
<given-names>B. M.</given-names>
</name>
<name>
<surname>Henley</surname>
<given-names>W. E.</given-names>
</name>
<name>
<surname>Jones</surname>
<given-names>A. G.</given-names>
</name>
<name>
<surname>Hattersley</surname>
<given-names>A. T.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Disease progression and treatment response in data-driven subgroups of type 2 diabetes compared with models based on simple clinical features: An analysis using clinical trial data</article-title>. <source>Lancet Diabetes Endocrinol.</source> <volume>7</volume>, <fpage>442</fpage>&#x2013;<lpage>451</lpage>. <pub-id pub-id-type="doi">10.1016/S2213-8587(19)30087-7</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Friedman</surname>
<given-names>J. H.</given-names>
</name>
</person-group> (<year>2001</year>). <article-title>Greedy function approximation: A gradient boosting machine</article-title>. <source>Ann. Statistics</source> <volume>29</volume>, <fpage>44</fpage>. <pub-id pub-id-type="doi">10.1214/aos/1013203451</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gibbons</surname>
<given-names>K. S.</given-names>
</name>
<name>
<surname>Chang</surname>
<given-names>A. M. Z.</given-names>
</name>
<name>
<surname>Ma</surname>
<given-names>R. C. W.</given-names>
</name>
<name>
<surname>Tam</surname>
<given-names>W. H.</given-names>
</name>
<name>
<surname>Catalano</surname>
<given-names>P. M.</given-names>
</name>
<name>
<surname>Sacks</surname>
<given-names>D. A.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Prediction of large-for-gestational age infants in relation to hyperglycemia in pregnancy - a comparison of statistical models</article-title>. <source>Diabetes Res. Clin. Pract.</source> <volume>178</volume>, <fpage>108975</fpage>. <pub-id pub-id-type="doi">10.1016/j.diabres.2021.108975</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Griffith</surname>
<given-names>K. N.</given-names>
</name>
<name>
<surname>Prentice</surname>
<given-names>J. C.</given-names>
</name>
<name>
<surname>Mohr</surname>
<given-names>D. C.</given-names>
</name>
<name>
<surname>Conlin</surname>
<given-names>P. R.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Predicting 5- and 10-year mortality risk in older adults with diabetes</article-title>. <source>Diabetes Care</source> <volume>43</volume>, <fpage>1724</fpage>&#x2013;<lpage>1731</lpage>. <pub-id pub-id-type="doi">10.2337/dc19-1870</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Guolin</surname>
<given-names>K. Q. M.</given-names>
</name>
<name>
<surname>Thomas</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Weidong</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Qiwei</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>LightGBM: A highly efficient gradient boosting decision tree [M]</article-title>. <source>Adv. Neural Inf. Process. Syst.</source> <volume>30</volume>, <fpage>8</fpage>.</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Heerspink</surname>
<given-names>H. J. L.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Predicting individual treatment response in diabetes</article-title>. <source>Lancet Diabetes Endocrinol.</source> <volume>7</volume>, <fpage>415</fpage>&#x2013;<lpage>417</lpage>. <pub-id pub-id-type="doi">10.1016/S2213-8587(19)30118-4</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Shen</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Yan</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Ding</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>H.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Relationship between estimated glycosylated hemoglobin using flash glucose monitoring and actual measured glycosylated hemoglobin in a Chinese population</article-title>. <source>Diabetes Ther.</source> <volume>11</volume>, <fpage>2019</fpage>&#x2013;<lpage>2027</lpage>. <pub-id pub-id-type="doi">10.1007/s13300-020-00879-x</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jaillard</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Palmieri</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Van Belkum</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Mah&#xe9;</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Interpreting k-mer-based signatures for antibiotic resistance prediction</article-title>. <source>Gigascience</source> <volume>9</volume>, <fpage>110</fpage>. <pub-id pub-id-type="doi">10.1093/gigascience/giaa110</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kursa</surname>
<given-names>M. B. R. W. R.</given-names>
</name>
<name>
<surname>Rudnicki</surname>
<given-names>W. R.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Feature selection with the Boruta package</article-title>. <source>J. Stat. Softw.</source> <volume>36</volume>, <fpage>13</fpage>. <pub-id pub-id-type="doi">10.18637/jss.v036.i11</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Law</surname>
<given-names>G. R.</given-names>
</name>
<name>
<surname>Gilthorpe</surname>
<given-names>M. S.</given-names>
</name>
<name>
<surname>Secher</surname>
<given-names>A. L.</given-names>
</name>
<name>
<surname>Temple</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Bilous</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Mathiesen</surname>
<given-names>E. R.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Translating HbA(1c) measurements into estimated average glucose values in pregnant women with diabetes</article-title>. <source>Diabetologia</source> <volume>60</volume>, <fpage>618</fpage>&#x2013;<lpage>624</lpage>. <pub-id pub-id-type="doi">10.1007/s00125-017-4205-7</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Leong</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Daya</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Porneala</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Devlin</surname>
<given-names>J. J.</given-names>
</name>
<name>
<surname>Shiffman</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>McPhaul</surname>
<given-names>M. J.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Prediction of type 2 diabetes by hemoglobin A(1c) in two community-based cohorts</article-title>. <source>Diabetes Care</source> <volume>41</volume>, <fpage>60</fpage>&#x2013;<lpage>68</lpage>. <pub-id pub-id-type="doi">10.2337/dc17-0607</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lewin-Epstein</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Baruch</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Hadany</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Stein</surname>
<given-names>G. Y.</given-names>
</name>
<name>
<surname>Obolski</surname>
<given-names>U.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Predicting antibiotic resistance in hospitalized patients by applying machine learning to electronic medical records</article-title>. <source>Clin. Infect. Dis.</source> <volume>72</volume>, <fpage>e848</fpage>&#x2013;<lpage>e855</lpage>. <pub-id pub-id-type="doi">10.1093/cid/ciaa1576</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liao</surname>
<given-names>L. D.</given-names>
</name>
<name>
<surname>Ferrara</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Greenberg</surname>
<given-names>M. B.</given-names>
</name>
<name>
<surname>Ngo</surname>
<given-names>A. L.</given-names>
</name>
<name>
<surname>Feng</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Z.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Development and validation of prediction models for gestational diabetes treatment modality using supervised machine learning: A population-based cohort study</article-title>. <source>BMC Med.</source> <volume>20</volume>, <fpage>307</fpage>. <pub-id pub-id-type="doi">10.1186/s12916-022-02499-7</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lindvig</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Tran</surname>
<given-names>M. P.</given-names>
</name>
<name>
<surname>Kidd</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Tikkanen</surname>
<given-names>C. K.</given-names>
</name>
<name>
<surname>G&#xe6;de</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>The economic burden of poor glycemic control associated with therapeutic inertia in patients with type 2 diabetes in Denmark</article-title>. <source>Curr. Med. Res. Opin.</source> <volume>37</volume>, <fpage>949</fpage>&#x2013;<lpage>956</lpage>. <pub-id pub-id-type="doi">10.1080/03007995.2021.1904863</pub-id>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lo-Ciganic</surname>
<given-names>W. H.</given-names>
</name>
<name>
<surname>Donohue</surname>
<given-names>J. M.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>J. L.</given-names>
</name>
<name>
<surname>Chang</surname>
<given-names>C. Y.</given-names>
</name>
<name>
<surname>Weiss</surname>
<given-names>J. C.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Developing and validating a machine-learning algorithm to predict opioid overdose in medicaid beneficiaries in two US states: A prognostic modelling study</article-title>. <source>Lancet Digit. Health</source> <volume>4</volume>, <fpage>e455</fpage>&#x2013;<lpage>e465</lpage>. <pub-id pub-id-type="doi">10.1016/S2589-7500(22)00062-0</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>L&#xf6;W</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Hesser</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Blessing</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Multiple retrieval case-based reasoning for incomplete datasets</article-title>. <source>J. Biomed. Inf.</source> <volume>92</volume>, <fpage>103127</fpage>. <pub-id pub-id-type="doi">10.1016/j.jbi.2019.103127</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Marquardt</surname>
<given-names>D. W.</given-names>
</name>
<name>
<surname>Snee</surname>
<given-names>R. D.</given-names>
</name>
</person-group> (<year>1975</year>). <article-title>Ridge regression in practice</article-title>. <source>The American Statistician</source> <volume>29</volume> (<issue>1</issue>), <fpage>3</fpage>&#x2013;<lpage>20</lpage>. <pub-id pub-id-type="doi">10.1080/00031305.1975.10479105</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Qu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Duan</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>C.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Predicting the risk of pulmonary arterial hypertension in systemic lupus erythematosus: A Chinese systemic lupus erythematosus treatment and research group cohort study</article-title>. <source>Arthritis Rheumatol.</source> <volume>73</volume>, <fpage>1847</fpage>&#x2013;<lpage>1855</lpage>. <pub-id pub-id-type="doi">10.1002/art.41740</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Reach</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Pechtner</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Gentilella</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Corcos</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Ceriello</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Clinical inertia and its impact on treatment intensification in people with type 2 diabetes mellitus</article-title>. <source>Diabetes Metab.</source> <volume>43</volume>, <fpage>501</fpage>&#x2013;<lpage>511</lpage>. <pub-id pub-id-type="doi">10.1016/j.diabet.2017.06.003</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rohlfing</surname>
<given-names>C. L.</given-names>
</name>
<name>
<surname>Wiedmeyer</surname>
<given-names>H. M.</given-names>
</name>
<name>
<surname>Little</surname>
<given-names>R. R.</given-names>
</name>
<name>
<surname>England</surname>
<given-names>J. D.</given-names>
</name>
<name>
<surname>Tennill</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Goldstein</surname>
<given-names>D. E.</given-names>
</name>
</person-group> (<year>2002</year>). <article-title>Defining the relationship between plasma glucose and HbA(1c): Analysis of glucose profiles and HbA(1c) in the diabetes control and complications trial</article-title>. <source>Diabetes Care</source> <volume>25</volume>, <fpage>275</fpage>&#x2013;<lpage>278</lpage>. <pub-id pub-id-type="doi">10.2337/diacare.25.2.275</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rose</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Fliege</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Hildebrandt</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Schirop</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Klapp</surname>
<given-names>B. F.</given-names>
</name>
</person-group> (<year>2002</year>). <article-title>The network of psychological variables in patients with diabetes and their importance for quality of life and metabolic control</article-title>. <source>Diabetes Care</source> <volume>25</volume>, <fpage>35</fpage>&#x2013;<lpage>42</lpage>. <pub-id pub-id-type="doi">10.2337/diacare.25.1.35</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Simon</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Friedman</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Hastie</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Tibshirani</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>Regularization paths for cox&#x27;s proportional hazards model via coordinate descent</article-title>. <source>J. Stat. Softw.</source> <volume>39</volume>, <fpage>1</fpage>&#x2013;<lpage>13</lpage>. <pub-id pub-id-type="doi">10.18637/jss.v039.i05</pub-id>
</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Singha</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Dong</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Xiao</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>High resolution paddy rice maps in cloud-prone Bangladesh and Northeast India using Sentinel-1 data</article-title>. <source>Sci. Data</source> <volume>6</volume>, <fpage>26</fpage>. <pub-id pub-id-type="doi">10.1038/s41597-019-0036-3</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sun</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Saeedi</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Karuranga</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Pinkepank</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ogurtsova</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Duncan</surname>
<given-names>B. B.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>IDF Diabetes Atlas: Global, regional and country-level diabetes prevalence estimates for 2021 and projections for 2045</article-title>. <source>Diabetes Res. Clin. Pract.</source> <volume>183</volume>, <fpage>109119</fpage>. <pub-id pub-id-type="doi">10.1016/j.diabres.2021.109119</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tibshirani</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>1997</year>). <article-title>The lasso method for variable selection in the Cox model</article-title>. <source>Stat. Med.</source> <volume>16</volume>, <fpage>385</fpage>&#x2013;<lpage>395</lpage>. <pub-id pub-id-type="doi">10.1002/(sici)1097-0258(19970228)16:4&#x3c;385:aid-sim380&#x3e;3.0.co;2-3</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Wan</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Liang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Guizani</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2018</year>). <source>Deep multi-layer Perceptron classifier for behavior analysis to estimate Parkinson&#x27;s disease severity using smartphones</source>. <publisher-name>IEEE Access</publisher-name> <volume>6</volume>, <fpage>36825</fpage>&#x2013;<lpage>36833</lpage>. <pub-id pub-id-type="doi">10.1109/ACCESS.2018.2851382</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Fan</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Hong</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Applying machine learning models to predict medication nonadherence in crohn&#x27;s disease maintenance therapy</article-title>. <source>Patient Prefer Adherence</source> <volume>14</volume>, <fpage>917</fpage>&#x2013;<lpage>926</lpage>. <pub-id pub-id-type="doi">10.2147/PPA.S253732</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Xiang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Xie</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Nie</surname>
<given-names>X.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Maillard reaction between oligopeptides and reducing sugar at body temperature: The putative anti-glycation agents</article-title>. <source>Front. Nutr.</source> <volume>9</volume>, <fpage>1062777</fpage>. <pub-id pub-id-type="doi">10.3389/fnut.2022.1062777</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Zou</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Fu</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Capsule networks showed excellent performance in the classification of hERG blockers/nonblockers</article-title>. <source>Front. Pharmacol.</source> <volume>10</volume>, <fpage>1631</fpage>. <pub-id pub-id-type="doi">10.3389/fphar.2019.01631</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Williams</surname>
<given-names>G. C.</given-names>
</name>
<name>
<surname>Mcgregor</surname>
<given-names>H. A.</given-names>
</name>
<name>
<surname>King</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Nelson</surname>
<given-names>C. C.</given-names>
</name>
<name>
<surname>Glasgow</surname>
<given-names>R. E.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Variation in perceived competence, glycemic control, and patient satisfaction: Relationship to autonomy support from physicians</article-title>. <source>Patient Educ. Couns.</source> <volume>57</volume>, <fpage>39</fpage>&#x2013;<lpage>45</lpage>. <pub-id pub-id-type="doi">10.1016/j.pec.2004.04.001</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wu</surname>
<given-names>X. W.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>H. B.</given-names>
</name>
<name>
<surname>Yuan</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Long</surname>
<given-names>E. W.</given-names>
</name>
<name>
<surname>Tong</surname>
<given-names>R. S.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Predictive models of medication non-adherence risks of patients with T2D based on multiple machine learning algorithms</article-title>. <source>BMJ Open Diabetes Res. Care</source> <volume>8</volume>, <fpage>001055</fpage>. <pub-id pub-id-type="doi">10.1136/bmjdrc-2019-001055</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yu</surname>
<given-names>Y. D.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>K. S.</given-names>
</name>
<name>
<surname>Man Kim</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Ryu</surname>
<given-names>J. H.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>J. G.</given-names>
</name>
<name>
<surname>Lee</surname>
<given-names>K. W.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Artificial intelligence for predicting survival following deceased donor liver transplantation: Retrospective multi-center study</article-title>. <source>Int. J. Surg.</source> <volume>105</volume>, <fpage>106838</fpage>. <pub-id pub-id-type="doi">10.1016/j.ijsu.2022.106838</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Kalbaugh</surname>
<given-names>C. A.</given-names>
</name>
<name>
<surname>Shi</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Divers</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Islam</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2022</year>). <article-title>Machine learning approach to predict in-hospital mortality in patients admitted for peripheral artery disease in the United States</article-title>. <source>J. Am. Heart Assoc.</source> <volume>11</volume>, <fpage>026987</fpage>. <pub-id pub-id-type="doi">10.1161/JAHA.122.026987</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>