<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Chem.</journal-id>
<journal-title>Frontiers in Chemistry</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Chem.</abbrev-journal-title>
<issn pub-type="epub">2296-2646</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1056701</article-id>
<article-id pub-id-type="doi">10.3389/fchem.2022.1056701</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Chemistry</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Development of QSRR model for hydroxamic acids using PCA-GA-BP algorithm incorporated with molecular interaction-based features</article-title>
<alt-title alt-title-type="left-running-head">Nie et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/fchem.2022.1056701">10.3389/fchem.2022.1056701</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Nie</surname>
<given-names>Yiming</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/2029602/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Li</surname>
<given-names>Jia</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Yang</surname>
<given-names>Xinying</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Hou</surname>
<given-names>Xuben</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1170708/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Fang</surname>
<given-names>Hao</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/14605/overview"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Department of Medicinal Chemistry</institution>, <institution>School of Pharmaceutical Sciences</institution>, <institution>Cheeloo College of Medicine</institution>, <institution>Shandong University</institution>, <addr-line>Jinan</addr-line>, <addr-line>Shandong</addr-line>, <country>China</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Department of Pharmaceutical Analysis</institution>, <institution>School of Pharmaceutical Sciences</institution>, <institution>Cheeloo College of Medicine</institution>, <institution>Shandong University</institution>, <addr-line>Jinan</addr-line>, <addr-line>Shandong</addr-line>, <country>China</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1095858/overview">Kshatresh Dutta Dubey</ext-link>, Shiv Nadar University, India</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/532732/overview">Marcus Scotti</ext-link>, Federal University of Para&#xed;ba, Brazil</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1960083/overview">Maryam Salahinejad</ext-link>, Nuclear Science and Technology Research Institute (NSTRI), Iran</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Xinying Yang, <email>xinyingyang@sdu.edu.cn</email>; Xuben Hou, <email>hxb@sdu.edu.cn</email>; Hao Fang, <email>haofangcn@sdu.edu.cn</email>
</corresp>
<fn fn-type="other">
<p>This article was submitted to Theoretical and Computational Chemistry, a section of the journal Frontiers in Chemistry</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>22</day>
<month>11</month>
<year>2022</year>
</pub-date>
<pub-date pub-type="collection">
<year>2022</year>
</pub-date>
<volume>10</volume>
<elocation-id>1056701</elocation-id>
<history>
<date date-type="received">
<day>30</day>
<month>09</month>
<year>2022</year>
</date>
<date date-type="accepted">
<day>09</day>
<month>11</month>
<year>2022</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2022 Nie, Li, Yang, Hou and Fang.</copyright-statement>
<copyright-year>2022</copyright-year>
<copyright-holder>Nie, Li, Yang, Hou and Fang</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>As a potent zinc chelator, hydroxamic acid has been applied in the design of inhibitors of zinc metalloenzyme, such as histone deacetylases (HDACs). A series of hydroxamic acids with HDAC inhibitory activities were subjected to the QSRR (Quantitative Structure&#x2013;Retention Relationships) study. Experimental data in combination with calculated molecular descriptors were used for the development of the QSRR model. Specially, we employed PCA (principal component analysis) to accomplish dimension reduction of descriptors and utilized the principal components of compounds (16 training compounds, 4 validation compounds and 7 test compounds) to execute GA (genetic algorithm)-BP (error backpropagation) algorithm. We performed double cross-validation approach for obtaining a more convincing model. Moreover, we introduced molecular interaction-based features (molecular docking scores) as a new type of molecular descriptor to represent the interactions between analytes and the mobile phase. Our results indicated that the incorporation of molecular interaction-based features significantly improved the accuracy of the QSRR model, (R<sup>2</sup> value is 0.842, RMSEP value is 0.440, and MAE value is 0.573). Our study not only developed QSRR model for the prediction of the retention time of hydroxamic acid in HPLC but also proved the feasibility of using molecular interaction-based features as molecular descriptors.</p>
</abstract>
<kwd-group>
<kwd>structure retention relationships</kwd>
<kwd>hydroxamic acids</kwd>
<kwd>HPLC</kwd>
<kwd>molecular docking</kwd>
<kwd>PCA</kwd>
<kwd>GA-BP</kwd>
<kwd>double cross-validation</kwd>
</kwd-group>
<contract-num rid="cn001">81874288 92053105 82003590</contract-num>
<contract-num rid="cn002">ZR2019LZL004 ZR2020QH342</contract-num>
<contract-sponsor id="cn001">National Natural Science Foundation of China<named-content content-type="fundref-id">10.13039/501100001809</named-content>
</contract-sponsor>
<contract-sponsor id="cn002">Natural Science Fund for Distinguished Young Scholars of Shandong Province<named-content content-type="fundref-id">10.13039/100017445</named-content>
</contract-sponsor>
</article-meta>
</front>
<body>
<sec id="s1">
<title>Introduction</title>
<p>Hydroxamic acids have metal chelating properties. Especially, due to the high chelating power to zinc ions, hydroxamic acids are widely used as inhibitors of enzymes having a Zn<sup>2&#x2b;</sup> in the active site (matrix metalloproteinases (MMPs), tumor necrosis factor-alpha (TNF-&#x3b1;) converting enzyme, and histone deacetylase (HDAC)) (<xref ref-type="bibr" rid="B41">Schaal et al., 2018</xref>; <xref ref-type="bibr" rid="B15">Ho et al., 2020</xref>; <xref ref-type="bibr" rid="B40">Sanyal et al., 2022</xref>). Moreover, some drugs possessing hydroxamic acid structure, especially HDAC inhibitors, have been approved for the clinic (<xref ref-type="fig" rid="F1">Figure 1</xref>) (<xref ref-type="bibr" rid="B15">Ho et al., 2020</xref>). However, compounds having hydroxamic acid structure usually possess poor solubility and affect their chromatography analyze of them.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Chemical structures of hydroxamic acid-based drugs have been approved for the clinic or in clinical trails.</p>
</caption>
<graphic xlink:href="fchem-10-1056701-g001.tif"/>
</fig>
<p>Chromatography is a method by which we can obtain a lot of precise, comparable, and repeatable retention data for structure-diverse compounds. At the same experimental conditions, we can get the almost same results on analytes&#x2019; retention data. In a chromatographic system, the molecular structure of a compound determines its properties, and further, affect relative affinity for the mobile and stationary phases and, therefore, its retention characteristics (<xref ref-type="bibr" rid="B36">Roman, 2007</xref>; <xref ref-type="bibr" rid="B13">Ganesh et al., 2022</xref>). The quantitative structure-retention relationships (QSRR) have been used as a model approach to establish methods of property prediction (<xref ref-type="bibr" rid="B36">Roman, 2007</xref>). So the construction of the QSRR model is helpful for the chromatography of hydroxamic acids. Reliable structural descriptors are necessary for QSRR models. Here, we choose the results of the scoring functions based on experience as the new structural descriptors to regression analysis for the first time. Scoring functions are usually used to evaluate the rationality of the receptor-ligand binding mode obtained theoretically. They also can be applied to estimate the binding affinity between the receptor and ligands for molecular docking and virtual screening.</p>
<p>Each analyte has its retention behavior in a chromatographic system. To great extent, the analyte&#x2019;s retention behavior depends on the stationary phase of the chromatographic column and its structure. Some studies have reported the models to characterize the conformation of ODS (Octadecylsilyl) material (<xref ref-type="fig" rid="F2">Figure 2A</xref>) and the interaction with solvent molecules (<xref ref-type="bibr" rid="B20">Ledesma and Wornat, 2000</xref>; <xref ref-type="bibr" rid="B6">Brambilla et al., 2007</xref>). Meanwhile, docking procedure has been used to select the best pose for each ligand to build QSPR model and docking descriptors are calculated based on the major interactions between ligand and cyclodextrin (<xref ref-type="bibr" rid="B27">Mirrahimi et al., 2016</xref>). So we hypothesize the material of stationary phase (ODS) and the analytes in the mobile phase as &#x2018;receptors&#x2019; and &#x2018;ligands&#x2019; respectively to simulate the combination between protein and ligands. Then we can get some scores that can characterize the molecular interaction-based feature and be used as descriptors through various scoring functions. We attempted to adopt the molecular modeling and docking method and consider the docking scores (molecular interaction-based features) as descriptors to characterize the interaction between the stationary phase and analytes for estimating a more reliable QSRR model.</p>
<p>Multiple variables can provide abundant information for the research technically. But in many cases, there may be correlations between variables, which increases the complexity of problem analysis. PCA (principal component analysis) is one of the most widely used data dimension reduction algorithms. It can eliminate noise and some unimportant information and change the variables into a few independent integrated variables which can stand for the most kinds of information existing in each original variable (<xref ref-type="bibr" rid="B31">Prasad et al., 2022</xref>). A certain range of information loss can save us a lot of time and cost. BP (error backpropagation) neural network is a neural network algorithm used in QSPR (quantitative structure-property relationships) research, QSAR (quantitative structure-activity relationships) research, and other models&#x2019; establishment widely and can handle complex data effectively (<xref ref-type="bibr" rid="B25">Luo et al., 2015</xref>; <xref ref-type="bibr" rid="B3">Bahmani et al., 2021</xref>; <xref ref-type="bibr" rid="B54">Yang et al., 2021</xref>; <xref ref-type="bibr" rid="B53">Xie and Xue, 2022</xref>). Therefore, we applied it in the establishment of the QSRR model. Meanwhile, the GA (genetic algorithm) is capable of optimizing the initial weight and threshold, thereby improving the robustness of the BP neural network (<xref ref-type="bibr" rid="B55">Zhang et al., 2019</xref>; <xref ref-type="bibr" rid="B10">Fang et al., 2022</xref>). And because of the wide application of hydroxamic acids in the area of HDAC inhibitors, we apply the PCA-GA-BP (<xref ref-type="bibr" rid="B30">Pan et al., 2007</xref>; <xref ref-type="bibr" rid="B55">Zhang et al., 2019</xref>; <xref ref-type="bibr" rid="B22">Li et al., 2020</xref>; <xref ref-type="bibr" rid="B10">Fang et al., 2022</xref>) neural network to establish the QSRR model to predict the retention time of hydroxamic acid-based HDAC inhibitors, for making it convenient to do HPLC and test whether molecular interaction-based features can be applied as new structure descriptors. Meanwhile, to ensure reliability and precision, we utilized double cross-validation, which contains internal (inner) and external (outer) cross-validation loops, to establish models (<xref ref-type="bibr" rid="B37">Roy and Arnbure, 2016</xref>).</p>
</sec>
<sec id="s2">
<title>Experimental</title>
<sec id="s2-1">
<title>Chemicals and materials</title>
<p>If not specified, all chemicals were of analytical grade. The methanol was purchased from Fisher Chemical (HPLC Grade), while the formic acid was obtained from Kermel. The ultra-pure water was obtained from Heal Force SPW ultra-pure water system. All the twenty-seven analytes, including the marketed drugs or the compounds reported by our group&#x2019;s former work (<xref ref-type="bibr" rid="B51">Wang et al., 2014</xref>; <xref ref-type="bibr" rid="B12">Fu et al., 2015</xref>; <xref ref-type="bibr" rid="B24">Liu et al., 2016</xref>), were the compounds possessing hydroxamic acid structure and were synthesized and confirmed by ourselves.</p>
</sec>
<sec id="s2-2">
<title>HPLC analysis</title>
<p>All the compounds were tested on Agilent 1,100 system (Agilent Technologies, USA), equipped with a quaternary pump, manual injector (20&#xa0;&#x3bc;L sample loop), and VWD detector. The column used in this study was Phenomenex Luna 5u C18 (150&#x2a;4.6&#xa0;mm 5micron). The mobile phase consisted of 45% aqueous phase (contains 0.1% formic acid) and 55% methanol (contains 0.1% formic acid). The flow rate was 1&#xa0;ml/min and the UV detection was performed at 254&#xa0;nm. The retention time of each analyte was shown in <xref ref-type="sec" rid="s10">Supplementary Table S1</xref>.</p>
</sec>
<sec id="s2-3">
<title>QSRR model generation</title>
<sec id="s2-3-1">
<title>Calculation of the molecular descriptors</title>
<p>The steps of descriptor generation were as follows. First, we sketched molecular structures with ChemDraw 14.0. Then the molecules were minimized using Tripos Field (<xref ref-type="bibr" rid="B52">White, 1977</xref>; <xref ref-type="bibr" rid="B28">Motoc et al., 1986</xref>; <xref ref-type="bibr" rid="B49">Waltho et al., 1988</xref>; <xref ref-type="bibr" rid="B8">Clark et al., 1989</xref>; <xref ref-type="bibr" rid="B32">Purohit et al., 2020</xref>) in Sybyl-X 2.0 (<xref ref-type="bibr" rid="B46">SYBYL, 2012</xref>; <xref ref-type="bibr" rid="B23">Liang et al., 2021</xref>). The lowest energy structures were further optimized by undergoing (<xref ref-type="bibr" rid="B48">Turner et al., 2017</xref>) (PM7) (<xref ref-type="bibr" rid="B45">Stewart, 2013</xref>; <xref ref-type="bibr" rid="B48">Turner et al., 2017</xref>) in Molecular Orbital PACkage (MOPAC 2016) method. Then we used Schr&#xf6;dinger software to carry out the optimization function applying the Becke 3-parameter (exchange) with correlation by Lee Yang and Parr (B3LYP) (<xref ref-type="bibr" rid="B5">Becke, 1988</xref>; <xref ref-type="bibr" rid="B21">Lee et al., 1988</xref>; <xref ref-type="bibr" rid="B4">Becke, 1993</xref>; <xref ref-type="bibr" rid="B44">Stephens et al., 1994</xref>; <xref ref-type="bibr" rid="B1">Adekoya et al., 2022</xref>; <xref ref-type="bibr" rid="B39">Sakr et al., 2022</xref>) functional and the 6-31G (&#x2a;&#x2a;) (<xref ref-type="bibr" rid="B11">Frisch et al., 1984</xref>; <xref ref-type="bibr" rid="B1">Adekoya et al., 2022</xref>; <xref ref-type="bibr" rid="B39">Sakr et al., 2022</xref>) basis set, density functional theory (DFT) (<xref ref-type="bibr" rid="B7">Calais, 1993</xref>; <xref ref-type="bibr" rid="B18">Koch and Holthausen, 2001</xref>; <xref ref-type="bibr" rid="B1">Adekoya et al., 2022</xref>; <xref ref-type="bibr" rid="B39">Sakr et al., 2022</xref>), and the standard Poisson-Boltzmann continuum solvation function (PBF) (<xref ref-type="bibr" rid="B14">Gilson et al., 1985</xref>; <xref ref-type="bibr" rid="B42">Sharp and Honig, 1990</xref>; <xref ref-type="bibr" rid="B47">Tomasi and Persico, 1994</xref>; <xref ref-type="bibr" rid="B50">Wang et al., 2017</xref>) for further geometry optimization.</p>
<p>The Molecular Descriptors function of Schr&#xf6;dinger software was applied to descriptors calculation. The molecular descriptors, Schr&#xf6;dinger software can calculate, contain three main categories: Topological Descriptors, QikProp Properties, and Semiempirical Properties. The Handbook of Molecular Descriptors (<xref ref-type="bibr" rid="B35">Roberto Todeschini and Consonni, 2000</xref>) details the calculation procedure. 273 molecular descriptors were obtained, and for the sake of minimizing subsequent problems of chance correlation, descriptors which were constant or near-constant values, less than 0.0001 concerning standard deviation, strongly correlated (descriptors with a correlation coefficient &#x3e;0.90), and not available for all compounds were excluded. After the pre-reduction step, 197 molecular descriptors were obtained.</p>
</sec>
<sec id="s2-3-2">
<title>Molecular docking</title>
<p>The ODS model was manually established using Sybyl-X 2.0. All the analytes were docked against the ODS model using Surflex-Dock module (<xref ref-type="bibr" rid="B16">Jain, 2007</xref>; <xref ref-type="bibr" rid="B43">Singh et al., 2019</xref>). The representative docking result is shown in <xref ref-type="fig" rid="F2">Figure 2B</xref>. For each analyte, the docked conformation with the highest was selected and 8 different types of docking scores as new descriptors, including Total_Score, Crash, Polar, D_SCORE, PMF_SCORE, G_SCORE, CHEMSCORE, GLOBAL_SCORE (<xref ref-type="bibr" rid="B19">Kuntz et al., 1982</xref>; <xref ref-type="bibr" rid="B9">Eldridge et al., 1997</xref>; <xref ref-type="bibr" rid="B17">Jones et al., 1997</xref>; <xref ref-type="bibr" rid="B29">Muegge and Martin, 1999</xref>). The docking scores of each analyte were summarized in <xref ref-type="sec" rid="s10">Supplementary Table S2</xref> in Supporting Information.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>
<bold>(A)</bold> The liquid-like configuration of ODS. <bold>(B)</bold> Representative docking result of one of the analytes in the ODS (C18) model.</p>
</caption>
<graphic xlink:href="fchem-10-1056701-g002.tif"/>
</fig>
</sec>
<sec id="s2-3-3">
<title>Dimension reduction and the construction of the QSRR model</title>
<p>Because the descriptors were too much to get a good QSRR model rapidly, we performed the PCA on two matrixes, one consists of the descriptors without molecular interaction-based features and the other is made up of the descriptors with molecular interaction-based features, in Matlab (<xref ref-type="bibr" rid="B26">Matlab, 2013</xref>) to achieve the dimension reduction of independent variables (molecular descriptors). Before that, all the descriptors had to be standardized. The principal components which can reflect 95% of the original data were chosen for the building of the QSRR model.</p>
<p>The matrixes we obtained through PCA were independent variables and we added the retention time of each compound as the dependent variable to form two new matrixes. The retention time of each compound was added into the matrixes consisted of principal components to form two new matrixes. Each matrix was separated into two groups randomly, of which one was the training group consisted of twenty samples and the other one was the testing group consisted of seven samples. Each line was a sample and every column except the last one was the independent variable and the last column was the dependent variable.</p>
<p>GA-BP was performed on these two matrixes respectively. The matrix was divided into training group (20 compounds) which was used in the inner loop for the model training and selection, and test group (7 compounds) utilized to validate the precision of model externally. In the inner loop, we utilized 5-fold cross validation which means that we separate the training group into five portions and take four portions for training and one for validation for five times. Then we compared the mean absolute error (MAE) value of these five model in the internal validation and selected the one whose MAE value is lowest to process external prediction (<xref ref-type="bibr" rid="B37">Roy and Arnbure, 2016</xref>). Levenberg-Marquart optimization algorithm (<xref ref-type="bibr" rid="B33">Raja et al., 2021</xref>) was chosen for training step in Matlab R2020a. The number of the hidden layers and hidden neurons of each layer is significant for the BP model. The addition of hidden layers can reduce the error but also can make the network complicate and increase the training time and the tendency of over-fit. A single sufficiently largely hidden layer is adequate for the approximation of most simple functions (<xref ref-type="bibr" rid="B34">Reed and Marks, 1999</xref>). So one hidden layer is enough and we can increase the number of hidden neurons to improve the precision. The number of hidden neurons was determined with the experimental function (1).<disp-formula id="e1">
<mml:math id="m1">
<mml:mrow>
<mml:mi mathvariant="bold">h</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:msqrt>
<mml:mrow>
<mml:mi mathvariant="bold-italic">m</mml:mi>
<mml:mo>&#x2b;</mml:mo>
<mml:mi mathvariant="bold-italic">n</mml:mi>
</mml:mrow>
</mml:msqrt>
<mml:mo>&#x2b;</mml:mo>
<mml:mi mathvariant="bold-italic">&#x3b1;</mml:mi>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi mathvariant="bold-italic">h</mml:mi>
<mml:mo>&#x3c;</mml:mo>
<mml:mi mathvariant="bold-italic">N</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn mathvariant="bold">1</mml:mn>
<mml:mo>,</mml:mo>
<mml:mtext>&#x2009;</mml:mtext>
<mml:mi mathvariant="bold-italic">m</mml:mi>
<mml:mo>&#x3c;</mml:mo>
<mml:mi mathvariant="bold-italic">N</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
<label>(1)</label>
</disp-formula>h &#x3d; the number of hidden neurons, m &#x3d; the number of input nodes, n &#x3d; the output nodes, <italic>&#x3b1;</italic> &#x3d; adjustment constant between 1 and 10, and N &#x3d; the number of training samples.</p>
<p>To validate the accuracy of GA-BP models built for this study, the R<sup>2</sup>, the root-mean-square error prediction (RMSEP) and MAE were measured for an independent set of analytes that were completely separate from the training set used in creating a QSRR model. R<sup>2</sup> and RMSEP were defined as the function 2) (<xref ref-type="bibr" rid="B2">Alexander et al., 2015</xref>) and 3) (<xref ref-type="bibr" rid="B56">&#x17d;uvela et al., 2015</xref>) respectively.<disp-formula id="e2">
<mml:math id="m2">
<mml:mrow>
<mml:msup>
<mml:mi mathvariant="bold-italic">R</mml:mi>
<mml:mn mathvariant="bold">2</mml:mn>
</mml:msup>
<mml:mo>&#x3d;</mml:mo>
<mml:mn mathvariant="bold">1</mml:mn>
<mml:mo>&#x2212;</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi mathvariant="bold-italic">y</mml:mi>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi mathvariant="bold-italic">o</mml:mi>
<mml:mi mathvariant="bold-italic">b</mml:mi>
<mml:mi mathvariant="bold-italic">s</mml:mi>
<mml:mi mathvariant="bold-italic">d</mml:mi>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mi mathvariant="bold-italic">y</mml:mi>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi mathvariant="bold-italic">p</mml:mi>
<mml:mi mathvariant="bold-italic">r</mml:mi>
<mml:mi mathvariant="bold-italic">e</mml:mi>
<mml:mi mathvariant="bold-italic">d</mml:mi>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mn mathvariant="bold">2</mml:mn>
</mml:msup>
<mml:msup>
<mml:mrow>
<mml:mrow>
<mml:mi>/</mml:mi>
<mml:mo>&#x2211;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi mathvariant="bold-italic">y</mml:mi>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi mathvariant="bold-italic">o</mml:mi>
<mml:mi mathvariant="bold-italic">b</mml:mi>
<mml:mi mathvariant="bold-italic">s</mml:mi>
<mml:mi mathvariant="bold-italic">d</mml:mi>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mover accent="true">
<mml:mi mathvariant="bold-italic">y</mml:mi>
<mml:mo>&#xaf;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mn mathvariant="bold">2</mml:mn>
</mml:msup>
</mml:mrow>
</mml:math>
<label>(2)</label>
</disp-formula>
<disp-formula id="e3">
<mml:math id="m3">
<mml:mrow>
<mml:mi mathvariant="bold">R</mml:mi>
<mml:mi mathvariant="bold">M</mml:mi>
<mml:mi mathvariant="bold">S</mml:mi>
<mml:mi mathvariant="bold">E</mml:mi>
<mml:mi mathvariant="bold">P</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mroot>
<mml:mrow>
<mml:munderover>
<mml:mstyle displaystyle="true">
<mml:mo>&#x2211;</mml:mo>
</mml:mstyle>
<mml:mrow>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:mrow>
<mml:mi mathvariant="bold-italic">n</mml:mi>
</mml:munderover>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mfrac>
<mml:mrow>
<mml:mi mathvariant="bold-italic">y</mml:mi>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi mathvariant="bold-italic">o</mml:mi>
<mml:mi mathvariant="bold-italic">b</mml:mi>
<mml:mi mathvariant="bold-italic">s</mml:mi>
<mml:mi mathvariant="bold-italic">d</mml:mi>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mi mathvariant="bold-italic">y</mml:mi>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi mathvariant="bold-italic">p</mml:mi>
<mml:mi mathvariant="bold-italic">r</mml:mi>
<mml:mi mathvariant="bold-italic">e</mml:mi>
<mml:mi mathvariant="bold-italic">d</mml:mi>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="bold-italic">y</mml:mi>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi mathvariant="bold-italic">o</mml:mi>
<mml:mi mathvariant="bold-italic">b</mml:mi>
<mml:mi mathvariant="bold-italic">s</mml:mi>
<mml:mi mathvariant="bold-italic">d</mml:mi>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mn mathvariant="bold">2</mml:mn>
</mml:msup>
<mml:mi>/</mml:mi>
<mml:mi mathvariant="bold-italic">n</mml:mi>
</mml:mrow>
</mml:mrow>
<mml:mn mathvariant="bold">2</mml:mn>
</mml:mroot>
</mml:mrow>
</mml:math>
<label>(3)</label>
</disp-formula>
<disp-formula id="e4">
<mml:math id="m4">
<mml:mrow>
<mml:mi mathvariant="bold">M</mml:mi>
<mml:mi mathvariant="bold">A</mml:mi>
<mml:mi mathvariant="bold">E</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:munderover>
<mml:mstyle displaystyle="true">
<mml:mo>&#x2211;</mml:mo>
</mml:mstyle>
<mml:mrow>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn mathvariant="bold">1</mml:mn>
</mml:mrow>
<mml:mi mathvariant="bold-italic">n</mml:mi>
</mml:munderover>
<mml:mrow>
<mml:mo>&#x7c;</mml:mo>
<mml:mrow>
<mml:mi mathvariant="bold-italic">y</mml:mi>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi mathvariant="bold-italic">p</mml:mi>
<mml:mi mathvariant="bold-italic">r</mml:mi>
<mml:mi mathvariant="bold-italic">e</mml:mi>
<mml:mi mathvariant="bold-italic">d</mml:mi>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mi mathvariant="bold-italic">y</mml:mi>
<mml:mi mathvariant="bold-italic">i</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi mathvariant="bold-italic">o</mml:mi>
<mml:mi mathvariant="bold-italic">b</mml:mi>
<mml:mi mathvariant="bold-italic">s</mml:mi>
<mml:mi mathvariant="bold-italic">d</mml:mi>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mo>&#x7c;</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mi mathvariant="bold-italic">n</mml:mi>
</mml:mfrac>
</mml:mrow>
</mml:math>
<label>(4)</label>
</disp-formula>yi (obsd) &#x3d; observed retention time, <inline-formula id="inf1">
<mml:math id="m5">
<mml:mrow>
<mml:mover accent="true">
<mml:mi mathvariant="normal">y</mml:mi>
<mml:mo>&#xaf;</mml:mo>
</mml:mover>
</mml:mrow>
</mml:math>
</inline-formula> &#x3d; the mean of observed retention time, yi (pred) &#x3d; predicted retention time, n &#x3d; the number of analytes.</p>
</sec>
<sec id="s2-3-4">
<title>Applicability domain</title>
<p>The purpose of establishing the QSRR model is to predict the retention value of new chemical entries falling within the applicability domain (AD) of the developed model. The reliability of any QSRR model relies on the confident predictions of these new compounds based on the AD of the model, and therein lies the importance of the AD study. Therefore, we harnessed an approach which has been reported to test the compounds we used whether were suitable. If the means of the S<sub>i</sub> (the corresponding standardized value for principal component <italic>i</italic> of one compound) values of a compound for all components in a model plus 1.28 times corresponding standard deviation (call it S<sub>new</sub>) is lower than 3, then there is 90% probability that the S<sub>i</sub> values of that compound are lower than 3. Thus, when S<sub>new</sub> value of a compound is lower than 3, then the compound can be considered to be not an X-outlier (if in the training group) or within the AD (if in the test group). (<xref ref-type="bibr" rid="B38">Roy et al., 2015</xref>).</p>
</sec>
</sec>
</sec>
<sec sec-type="results|discussion" id="s3">
<title>Results and discussion</title>
<sec id="s3-1">
<title>Generation of principal components</title>
<p>After the dimension reduction by the PCA, some components were obtained. The principal components were ranked according to the contribution rate and we selected the first few components whose cumulative contribution rate can reach 95% to form new matrixes. The matrix generated from the matrix without molecular interaction-based features was named matrix 1, the other one called matrix 2. The contribution rates of these principal components of two matrixes are shown in <xref ref-type="table" rid="T1">Table 1</xref> and <xref ref-type="table" rid="T2">Table 2</xref> (The principle components of each analyte of two matrixes were shown in <xref ref-type="sec" rid="s10">Supplementary Tables S3, S4</xref>).</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Principal Components and their contribution rates (PCA was performed on the matrix consisting of descriptors without molecular interaction-based features).</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Principal components</th>
<th align="left">Contribution rates%</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">PC 1</td>
<td align="left">47.26435108</td>
</tr>
<tr>
<td align="left">PC 2</td>
<td align="left">21.77876205</td>
</tr>
<tr>
<td align="left">PC 3</td>
<td align="left">8.443341288</td>
</tr>
<tr>
<td align="left">PC 4</td>
<td align="left">6.057161663</td>
</tr>
<tr>
<td align="left">PC 5</td>
<td align="left">4.912323874</td>
</tr>
<tr>
<td align="left">PC 6</td>
<td align="left">3.076686032</td>
</tr>
<tr>
<td align="left">PC 7</td>
<td align="left">2.121700455</td>
</tr>
<tr>
<td align="left">PC 8</td>
<td align="left">1.393171762</td>
</tr>
<tr>
<td align="left">Total</td>
<td align="left">95.0474982</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Principal Components and their contribution rates (PCA was performed on the matrix consisting of descriptors with molecular interaction-based features).</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Principal components</th>
<th align="left">Contribution rates%</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">PC&#x2032; 1</td>
<td align="left">45.58673414</td>
</tr>
<tr>
<td align="left">PC&#x2032; 2</td>
<td align="left">21.67436145</td>
</tr>
<tr>
<td align="left">PC&#x2032; 3</td>
<td align="left">8.723766792</td>
</tr>
<tr>
<td align="left">PC&#x2032; 4</td>
<td align="left">6.572024529</td>
</tr>
<tr>
<td align="left">PC&#x2032; 5</td>
<td align="left">4.802069629</td>
</tr>
<tr>
<td align="left">PC&#x2032; 6</td>
<td align="left">3.051923618</td>
</tr>
<tr>
<td align="left">PC&#x2032; 7</td>
<td align="left">2.139011586</td>
</tr>
<tr>
<td align="left">PC&#x2032; 8</td>
<td align="left">1.670127367</td>
</tr>
<tr>
<td align="left">PC&#x2032; 9</td>
<td align="left">1.249293494</td>
</tr>
<tr>
<td align="left">Total</td>
<td align="left">95.4693126</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>According to the results of PCA performed on different matrixes, when the molecular interaction-based features are added as new descriptors, one more component was gained and the contribution rates of principal components are different. Since the PCA can reduce the correlation of variables and change the closely related variables into as few new variables as possible, these new variables are not related in pairs. It suggests the molecular interaction-based features, to a certain extent, are independent of other descriptors.</p>
</sec>
<sec id="s3-2">
<title>Determination of the number of hidden neurons</title>
<p>With the selection range of the number of hidden neurons existing, we used each number to test on each matrix 20 frequencies respectively to find the optimum number of hidden neurons. The Regression R values measure the correlation between outputs and targets, meaning predicted retention time and observed retention time here. An R-value of 1 means a close relationship and 0 means a random relationship. We took whether the Regression R-value reaches 0.95 as a simple judgment criterion of the training model and counted the number of frequencies that R-value reaches 0.95 when the different number of hidden neurons was chosen to run. The results are shown in <xref ref-type="table" rid="T3">Table 3</xref> and <xref ref-type="table" rid="T4">Table 4</xref>.</p>
<table-wrap id="T3" position="float">
<label>TABLE 3</label>
<caption>
<p>The frequencies that R-value reaches 0.95 (performing on the training group of matrix 1).</p>
</caption>
<table>
<thead valign="top">
<tr>
<th rowspan="2" align="left">h</th>
<th colspan="4" align="left">The frequencies that R-value reaches 0.95</th>
<th rowspan="2" align="left">nr</th>
</tr>
<tr>
<th align="left">T<sub>1</sub>
</th>
<th align="left">V</th>
<th align="left">T<sub>2</sub>
</th>
<th align="left">A</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">4</td>
<td align="left">5</td>
<td align="left">5</td>
<td align="left">6</td>
<td align="left">0</td>
<td align="left">0</td>
</tr>
<tr>
<td align="left">5</td>
<td align="left">5</td>
<td align="left">5</td>
<td align="left">3</td>
<td align="left">2</td>
<td align="left">0</td>
</tr>
<tr>
<td align="left">6</td>
<td align="left">12</td>
<td align="left">4</td>
<td align="left">3</td>
<td align="left">0</td>
<td align="left">0</td>
</tr>
<tr>
<td align="left">7</td>
<td align="left">3</td>
<td align="left">6</td>
<td align="left">6</td>
<td align="left">0</td>
<td align="left">0</td>
</tr>
<tr>
<td align="left">8</td>
<td align="left">8</td>
<td align="left">10</td>
<td align="left">5</td>
<td align="left">0</td>
<td align="left">0</td>
</tr>
<tr>
<td align="left">9</td>
<td align="left">3</td>
<td align="left">6</td>
<td align="left">1</td>
<td align="left">0</td>
<td align="left">0</td>
</tr>
<tr>
<td align="left">10</td>
<td align="left">8</td>
<td align="left">6</td>
<td align="left">5</td>
<td align="left">0</td>
<td align="left">0</td>
</tr>
<tr>
<td align="left">11</td>
<td align="left">6</td>
<td align="left">10</td>
<td align="left">4</td>
<td align="left">1</td>
<td align="left">1</td>
</tr>
<tr>
<td align="left">12</td>
<td align="left">6</td>
<td align="left">7</td>
<td align="left">6</td>
<td align="left">0</td>
<td align="left">0</td>
</tr>
<tr>
<td align="left">13</td>
<td align="left">11</td>
<td align="left">8</td>
<td align="left">2</td>
<td align="left">1</td>
<td align="left">0</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>h is the number of hidden neurons. T<sub>1</sub> is T1 Set. V is the V Set. T<sub>2</sub> is the T2 Set. A is the All Set. nr. is the frequencies that R values reach 0.95&#xa0;at the same time. (The names of four sets were given by algorithm contained in MATLAB automatically).</p>
</fn>
</table-wrap-foot>
</table-wrap>
<table-wrap id="T4" position="float">
<label>TABLE 4</label>
<caption>
<p>The frequencies that R-value reaches 0.95 (performing on the training group of matrix 2).</p>
</caption>
<table>
<thead valign="top">
<tr>
<th rowspan="2" align="left">h</th>
<th colspan="4" align="left">The frequencies that R-value reaches 0.95</th>
<th rowspan="2" align="left">nr</th>
</tr>
<tr>
<th align="left">T<sub>1</sub>
</th>
<th align="left">V</th>
<th align="left">T<sub>2</sub>
</th>
<th align="left">A</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">4</td>
<td align="left">3</td>
<td align="left">7</td>
<td align="left">4</td>
<td align="left">1</td>
<td align="left">0</td>
</tr>
<tr>
<td align="left">5</td>
<td align="left">2</td>
<td align="left">7</td>
<td align="left">6</td>
<td align="left">1</td>
<td align="left">1</td>
</tr>
<tr>
<td align="left">6</td>
<td align="left">12</td>
<td align="left">7</td>
<td align="left">4</td>
<td align="left">2</td>
<td align="left">1</td>
</tr>
<tr>
<td align="left">7</td>
<td align="left">6</td>
<td align="left">10</td>
<td align="left">6</td>
<td align="left">1</td>
<td align="left">0</td>
</tr>
<tr>
<td align="left">8</td>
<td align="left">5</td>
<td align="left">8</td>
<td align="left">2</td>
<td align="left">1</td>
<td align="left">1</td>
</tr>
<tr>
<td align="left">9</td>
<td align="left">8</td>
<td align="left">10</td>
<td align="left">7</td>
<td align="left">0</td>
<td align="left">0</td>
</tr>
<tr>
<td align="left">10</td>
<td align="left">7</td>
<td align="left">6</td>
<td align="left">1</td>
<td align="left">1</td>
<td align="left">0</td>
</tr>
<tr>
<td align="left">11</td>
<td align="left">7</td>
<td align="left">6</td>
<td align="left">3</td>
<td align="left">2</td>
<td align="left">1</td>
</tr>
<tr>
<td align="left">12</td>
<td align="left">11</td>
<td align="left">11</td>
<td align="left">5</td>
<td align="left">1</td>
<td align="left">1</td>
</tr>
<tr>
<td align="left">13</td>
<td align="left">7</td>
<td align="left">3</td>
<td align="left">8</td>
<td align="left">1</td>
<td align="left">0</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>h is the number of hidden neurons. T<sub>1</sub> is T1 Set. V is the V Set. T<sub>2</sub> is the T2 Test Set. A is the All Set. nr. is the frequencies that R values reach 0.95&#xa0;at the same time. (The names of four sets were given by algorithm contained in MATLAB automatically).</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>According to the results above, the frequencies that R-value reaches 0.95 of the All Set have been improved apparently when we added the molecular interaction-based features as molecular descriptors, which suggested they are beneficial for the accuracy of QSRR models. Meanwhile, the frequencies that R values of four sets reach 0.95 at the same time are improved as well. Through the running with different numbers of hidden neurons on different matrixes, we decided to choose 11 hidden neurons to perform the GA-BP algorithm. Because the R values of Training Set, Validation Set, Test Set, and All Set (for the avoidance of the conflict of names, we renamed them T1 set, V set and T2 set), which were assigned randomly by the Levenberg-Marquart optimization algorithm, can reach 0.95 at the same time when we took eleven hidden neurons to perform the algorithm on the training group of matrix 1 and 2 (After the PCA, the matrix generated from the matrix without molecular interaction-based features named matrix 1, the other one called matrix 2).</p>
</sec>
<sec id="s3-3">
<title>The establishment of the QSRR model</title>
<p>We took 11 hidden neurons and a double cross-validation approach to run GA-BP on the training groups of matrixes 1 and 2, and due to the random generation of weights initialization threshold, we take the same validation set to modelling 10 times respectively, then calculated the average of each training group (<xref ref-type="table" rid="T5">Table 5</xref>). Comparing the data shown in <xref ref-type="table" rid="T5">Table 5</xref>, we found that the MAE values of training groups whose principal components related to docking scores are mostly better than those without docking scores.</p>
<table-wrap id="T5" position="float">
<label>TABLE 5</label>
<caption>
<p>Selection of training models.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th rowspan="2" align="left">Matrix</th>
<th rowspan="2" align="left">k<sup>th</sup> fold</th>
<th colspan="10" align="left">MAE of each time</th>
<th rowspan="2" align="left">Average of MAE</th>
</tr>
<tr>
<th align="left">1</th>
<th align="left">2</th>
<th align="left">3</th>
<th align="left">4</th>
<th align="left">5</th>
<th align="left">6</th>
<th align="left">7</th>
<th align="left">8</th>
<th align="left">9</th>
<th align="left">10</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td rowspan="5" align="left">1</td>
<td align="left">k1</td>
<td align="left">2.6385</td>
<td align="left">0.5536</td>
<td align="left">1.5793</td>
<td align="left">2.6044</td>
<td align="left">4.8188</td>
<td align="left">6.0193</td>
<td align="left">2.501</td>
<td align="left">1.9305</td>
<td align="left">3.6009</td>
<td align="left">5.6812</td>
<td align="left">3.19275</td>
</tr>
<tr>
<td align="left">k2</td>
<td align="left">3.2298</td>
<td align="left">3.673</td>
<td align="left">4.0849</td>
<td align="left">3.501</td>
<td align="left">4.63</td>
<td align="left">4.0765</td>
<td align="left">4.0895</td>
<td align="left">4.092</td>
<td align="left">3.7948</td>
<td align="left">4.5111</td>
<td align="left">3.96826</td>
</tr>
<tr>
<td align="left">k3</td>
<td align="left">2.2915</td>
<td align="left">2.2608</td>
<td align="left">1.7267</td>
<td align="left">2.3488</td>
<td align="left">2.4065</td>
<td align="left">2.2028</td>
<td align="left">3.1336</td>
<td align="left">2.853</td>
<td align="left">2.3739</td>
<td align="left">2.2169</td>
<td align="left">2.38145</td>
</tr>
<tr>
<td align="left">k4</td>
<td align="left">3.7133</td>
<td align="left">3.6514</td>
<td align="left">1.6232</td>
<td align="left">5.1061</td>
<td align="left">1.8693</td>
<td align="left">5.9359</td>
<td align="left">4.5440</td>
<td align="left">4.6063</td>
<td align="left">2.0027</td>
<td align="left">3.9845</td>
<td align="left">3.703671</td>
</tr>
<tr>
<td align="left">k5</td>
<td align="left">2.9817</td>
<td align="left">4.4447</td>
<td align="left">2.6844</td>
<td align="left">3.2713</td>
<td align="left">2.4513</td>
<td align="left">4.9758</td>
<td align="left">1.4086</td>
<td align="left">3.158</td>
<td align="left">2.4287</td>
<td align="left">2.6385</td>
<td align="left">3.0443</td>
</tr>
<tr>
<td rowspan="5" align="left">2</td>
<td align="left">k1&#x2032;</td>
<td align="left">2.1501</td>
<td align="left">2.6904</td>
<td align="left">2.3996</td>
<td align="left">3.408</td>
<td align="left">4.8782</td>
<td align="left">1.8289</td>
<td align="left">2.0223</td>
<td align="left">3.0861</td>
<td align="left">3.2268</td>
<td align="left">2.6011</td>
<td align="left">2.82915</td>
</tr>
<tr>
<td align="left">k2&#x2032;</td>
<td align="left">3.8125</td>
<td align="left">3.0321</td>
<td align="left">3.1707</td>
<td align="left">3.9484</td>
<td align="left">1.9685</td>
<td align="left">3.6707</td>
<td align="left">3.8672</td>
<td align="left">2.2259</td>
<td align="left">4.965</td>
<td align="left">2.3368</td>
<td align="left">3.29978</td>
</tr>
<tr>
<td align="left">k3&#x2032;</td>
<td align="left">2.0024</td>
<td align="left">2.7605</td>
<td align="left">3.0042</td>
<td align="left">3.2663</td>
<td align="left">2.4173</td>
<td align="left">2.8182</td>
<td align="left">1.9522</td>
<td align="left">2.6188</td>
<td align="left">0.8307</td>
<td align="left">1.4076</td>
<td align="left">2.30782</td>
</tr>
<tr>
<td align="left">k4&#x2032;</td>
<td align="left">1.9059</td>
<td align="left">3.5847</td>
<td align="left">1.8069</td>
<td align="left">3.0382</td>
<td align="left">1.9059</td>
<td align="left">3.8669</td>
<td align="left">0.9266</td>
<td align="left">1.8069</td>
<td align="left">3.0382</td>
<td align="left">3.0382</td>
<td align="left">2.49184</td>
</tr>
<tr>
<td align="left">k5&#x2032;</td>
<td align="left">4.3536</td>
<td align="left">3.5158</td>
<td align="left">4.0454</td>
<td align="left">1.1736</td>
<td align="left">1.63</td>
<td align="left">4.085</td>
<td align="left">3.2323</td>
<td align="left">5.0584</td>
<td align="left">1.3107</td>
<td align="left">0.822</td>
<td align="left">2.92268</td>
</tr>
</tbody>
</table>
<table-wrap-foot>
<fn>
<p>k<sup>th</sup> fold means which one of the five portions was taken as validation test.</p>
</fn>
</table-wrap-foot>
</table-wrap>
<p>According to the averages of MAE values, we chose the third portion as the validation set in the inner loop of matrices 1 and 2. Then we used a test group to perform external prediction. The results are shown in <xref ref-type="fig" rid="F3">Figure 3</xref> which were the linear relationships of the predicted retention time obtained by using training models together with measured retention time and <xref ref-type="table" rid="T6">Table 6</xref>. The R<sup>2</sup> values of both test groups are greater than 0.6, suggesting the models are not rejected irrespective of the absolute error (<xref ref-type="bibr" rid="B2">Alexander et al., 2015</xref>). But when we put molecular interaction-based features into running, the RMSEP value had no apparent improvement, which has areas for further optimism. However, the MAE value becomes better. It manifested the molecular interaction-based features as an independent category of descriptors that were helpful to the establishment of the QSRR model to predict the retention time of hydroxamic acid.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>Comparison of test results of two matrixes. [<bold>(A)</bold> was the test group of matrix 1, and <bold>(B)</bold> was the test group of matrix 2].</p>
</caption>
<graphic xlink:href="fchem-10-1056701-g003.tif"/>
</fig>
<table-wrap id="T6" position="float">
<label>TABLE 6</label>
<caption>
<p>Prediction of the retention time of compounds in the testing set.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Analytes</th>
<th align="left">Predicted retention time/min (model 1)</th>
<th align="left">Predicted retention time 2/min (model 2)</th>
<th align="left">Observed retention time/min</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">
<inline-graphic xlink:href="FCHEM_fchem-2022-1056701_wc_tfx1.tif"/>
</td>
<td align="left">7.200123</td>
<td align="left">9.573565</td>
<td align="left">10.04</td>
</tr>
<tr>
<td align="left">
<inline-graphic xlink:href="FCHEM_fchem-2022-1056701_wc_tfx2.tif"/>
</td>
<td align="left">7.421031</td>
<td align="left">8.218716</td>
<td align="left">10.1</td>
</tr>
<tr>
<td align="left">
<inline-graphic xlink:href="FCHEM_fchem-2022-1056701_wc_tfx3.tif"/>
</td>
<td align="left">2.909212</td>
<td align="left">5.000308</td>
<td align="left">2.38</td>
</tr>
<tr>
<td align="left">
<inline-graphic xlink:href="FCHEM_fchem-2022-1056701_wc_tfx4.tif"/>
</td>
<td align="left">5.623486</td>
<td align="left">2.573642</td>
<td align="left">2.86</td>
</tr>
<tr>
<td align="left">
<inline-graphic xlink:href="FCHEM_fchem-2022-1056701_wc_tfx5.tif"/>
</td>
<td align="left">4.237541</td>
<td align="left">3.273094</td>
<td align="left">2.7</td>
</tr>
<tr>
<td align="left">
<inline-graphic xlink:href="FCHEM_fchem-2022-1056701_wc_tfx6.tif"/>
</td>
<td align="left">4.096308</td>
<td align="left">3.965852</td>
<td align="left">3.54</td>
</tr>
<tr>
<td align="left">
<inline-graphic xlink:href="FCHEM_fchem-2022-1056701_wc_tfx7.tif"/>
</td>
<td align="left">3.606235</td>
<td align="left">3.847673</td>
<td align="left">3.22</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3-4">
<title>Applicability domain</title>
<p>We performed the reported program to calculate the Snew values of our compounds. The result was shown in <xref ref-type="fig" rid="F4">Figure 4</xref>. The Snew values of all the compounds we used are lower than 3, which means they are suitable for the model and not X-outlier (if in the training group) or within the AD (if in the test group).</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Applicability domain.</p>
</caption>
<graphic xlink:href="fchem-10-1056701-g004.tif"/>
</fig>
</sec>
<sec id="s3-5">
<title>Detection of systematic error in predictions</title>
<p>For the determination of the quality of QSRR-derived predictions, we calculated the following five values: ratio of the number of positive and negative errors (NPE/NNE), absolute (ABS) of average error (AE) with mean absolute error (MAE), mean positive error (MPE) with mean negative error (MNE). The data was shown in <xref ref-type="table" rid="T7">Table 7</xref>.</p>
<table-wrap id="T7" position="float">
<label>TABLE 7</label>
<caption>
<p>Detection of systematic error in predictions.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">QSRR model</th>
<th align="left">NPE</th>
<th align="left">NNE</th>
<th align="left">MPE</th>
<th align="left">MNE</th>
<th align="left">MAE</th>
<th align="left">AE</th>
<th align="left">NPE/NNE or NNE/NPE</th>
<th align="left">ABS(MPE/MNE)</th>
<th align="left">MAE-ABS(AE)</th>
<th align="left">R<sup>2</sup> (<italic>i</italic>
<sup>th</sup> vs. (i-1)<sup>th</sup> residuals)</th>
<th align="left">R<sup>2</sup> (Y pred vs. residuals)</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">model 1</td>
<td align="left">3</td>
<td align="left">4</td>
<td align="left">0.75</td>
<td align="left">-0.92</td>
<td align="left">1.53</td>
<td align="left">0.04</td>
<td align="char" char="/">0.75/1.33</td>
<td align="left">0.81912</td>
<td align="left">1.501264</td>
<td align="left">0.0582</td>
<td align="left">0.2099</td>
</tr>
<tr>
<td align="left">model 2</td>
<td align="left">3</td>
<td align="left">4</td>
<td align="left">1.06</td>
<td align="left">-0.89</td>
<td align="left">0.57</td>
<td align="left">0.23</td>
<td align="char" char="/">0.75/1.33</td>
<td align="left">1.209227</td>
<td align="left">0.342687</td>
<td align="left">0.0302</td>
<td align="left">0.4208</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Recording to the reported criterions: 1) NPE/NNE &#x3e;5 or NNE/NPE &#x3e;5; 2) ABS(MPE/MNE) &#x3e; 2 or ABS(MNE/MPE) &#x3e; 2; 3) MAE - ABS(AE) &#x3c; 0.5&#xd7;MAE; 4) R<sup>2</sup> (<italic>i</italic>
<sup>th</sup> vs. (i-1)<sup>th</sup> residuals) &#x3e; 0.5 for residuals sorted on Y<sub>pred</sub>; 5) R<sup>2</sup>(Y vs. residuals) &#x3e; 0.5 [57], even if our models are not satisfy, in the future work, we need more analytes to improve, due to not satisfying the standard of number (at least 10).</p>
</sec>
<sec id="s3-6">
<title>PLS using docking scores</title>
<p>To investigate the relationship between molecular interaction-based features and retention time of compounds, we used molecular docking scores alone to run the PLS algorism in Matlab. Fifteen analytes were used as a training group to generate the coefficients of each type of docking score and the constant term. The simulation training and predicting of the test group were following (<xref ref-type="fig" rid="F5">Figure 5</xref>). We found that a remarkable error existed between the predicted retention time and observed retention time. Our results suggested the regression using molecular interaction-based features alone to construct the QSRR model is unfeasible.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>
<bold>(A)</bold> The predicted retention time obtained by PLS method vs. observed retention time; <bold>(B)</bold> The prediction error of PLS for each analyte of the test group.</p>
</caption>
<graphic xlink:href="fchem-10-1056701-g005.tif"/>
</fig>
</sec>
<sec id="s3-7">
<title>Analyze of the relevance between molecular interaction-based features and retention time</title>
<p>We took the molecular docking results of two analytes (analyte 6 and 23 are shown in <xref ref-type="sec" rid="s10">Supplementary Table S1</xref> and <xref ref-type="fig" rid="F6">Figure 6</xref>), whose retention time is notably different (14.86&#xa0;min <italic>vs</italic> 2.38&#xa0;min), to investigate the relevance. The docking results are shown in <xref ref-type="fig" rid="F6">Figures 6A,B</xref>. Obviously, analyte 6 could occupy larger area of ODS surface than analyte 23. As expected, the docking scores of analyte 6 are larger than that of analyte 23 (<xref ref-type="fig" rid="F6">Figure 6C</xref>). Therefore, if the analytes could occupy more area of the material, it could generate more interaction force between these two things and have better docking result (larger minus) and large retention values. So, these molecular interaction-based features could be helpful to the prediction of analytes and improve the precision of QSRR models.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>
<bold>(A)</bold> The docking result of analyte 6. <bold>(B)</bold> The docking result of analyte 23. <bold>(C)</bold> Comparison of molecular docking scores (molecular interaction-based features) of analyte 6 and 23.</p>
</caption>
<graphic xlink:href="fchem-10-1056701-g006.tif"/>
</fig>
</sec>
</sec>
<sec sec-type="conclusion" id="s4">
<title>Conclusion</title>
<p>The PCA-GA-BP method was employed to establish QSRR models for hydroxamic acids and the double cross-validation approach using internal 5-fold cross validation guaranteed the reliability of training model and exploited finite training compounds sufficiently. The interaction between analytes and solid-phase materials was measured using molecular docking scores, which were introduced as new features in the QSRR model. These features could manifest the strength of interaction between analytes and solid-phase material (At least in the docking of drug molecules and proteins). As a new type of molecular descriptors, molecular interaction-based features (docking scores) could contribute to the dimension reduction, selection of hidden neurons, model selection and prediction of retention time. Our QSRR model could be used to predict the retention time of hydroxamic acids.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s5">
<title>Data availability statement</title>
<p>The original contributions presented in the study are included in the article/<xref ref-type="sec" rid="s10">Supplementary Materials</xref>, further inquiries can be directed to the corresponding authors.</p>
</sec>
<sec id="s6">
<title>Author contributions</title>
<p>YN: Methodology, Software, Validation, Investigation, Writing&#x2014;original draft. JL: Validation, Resources. XY: Validation, Resources. XH: Conceptualization, Methodology, Resources, Writing&#x2014;review and editing. HF: Conceptualization, Methodology, Resources, Writing&#x2014;review and editing.</p>
</sec>
<sec id="s7">
<title>Funding</title>
<p>This work was supported by the National Nature Science Foundation of China (81874288, 92053105, and 82003590), the Shandong Provincial Natural Science Foundation (ZR2019LZL004 and ZR2020QH342).</p>
</sec>
<ack>
<p>We genuinely thank the Advanced Medical Research Institute, Shandong University, for their help in the experiments.</p>
</ack>
<sec sec-type="COI-statement" id="s8">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s9">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s10">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fchem.2022.1056701/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fchem.2022.1056701/full&#x23;supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="DataSheet1.pdf" id="SM1" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Adekoya</surname>
<given-names>O. C.</given-names>
</name>
<name>
<surname>Adekoya</surname>
<given-names>G. J.</given-names>
</name>
<name>
<surname>Sadiku</surname>
<given-names>E. R.</given-names>
</name>
<name>
<surname>Hamam</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Ray</surname>
<given-names>S. S.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Application of DFT calculations in designing polymer-based drug delivery systems: An overview</article-title>. <source>Pharmaceutics</source> <volume>14</volume> (<issue>9</issue>), <fpage>1972</fpage>. <pub-id pub-id-type="doi">10.3390/pharmaceutics14091972</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alexander</surname>
<given-names>D. L.</given-names>
</name>
<name>
<surname>Tropsha</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Winkler</surname>
<given-names>D. A.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Beware of R(2): Simple, unambiguous assessment of the prediction accuracy of QSAR and QSPR models</article-title>. <source>J. Chem. Inf. Model.</source> <volume>55</volume> (<issue>7</issue>), <fpage>1316</fpage>&#x2013;<lpage>1322</lpage>. <pub-id pub-id-type="doi">10.1021/acs.jcim.5b00206</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bahmani</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Tanzadehpanah</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Hosseinpour Moghadam</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Saidijam</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Introducing a pyrazolopyrimidine as a multi-tyrosine kinase inhibitor, using multi-QSAR and docking methods</article-title>. <source>Mol. Divers.</source> <volume>25</volume> (<issue>2</issue>), <fpage>949</fpage>&#x2013;<lpage>965</lpage>. <pub-id pub-id-type="doi">10.1007/s11030-020-10080-8</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Becke</surname>
<given-names>A. D.</given-names>
</name>
</person-group> (<year>1993</year>). <article-title>A new mixing of Hartree&#x2013;Fock and local density&#x2010;functional theories</article-title>. <source>J. Chem. Phys.</source> <volume>98</volume> (<issue>2</issue>), <fpage>1372</fpage>&#x2013;<lpage>1377</lpage>. <pub-id pub-id-type="doi">10.1063/1.464304</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Becke</surname>
<given-names>A. D.</given-names>
</name>
</person-group> (<year>1988</year>). <article-title>Density-functional exchange-energy approximation with correct asymptotic behavior</article-title>. <source>Phys. Rev. A . Coll. Park.</source> <volume>38</volume> (<issue>6</issue>), <fpage>3098</fpage>&#x2013;<lpage>3100</lpage>. <pub-id pub-id-type="doi">10.1103/physreva.38.3098</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Brambilla</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Pires</surname>
<given-names>G. P.</given-names>
</name>
<name>
<surname>dos Santos</surname>
<given-names>J. H.</given-names>
</name>
<name>
<surname>Miranda</surname>
<given-names>M. S. L.</given-names>
</name>
<name>
<surname>Chornik</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>Octadecylsilane-modified silicas prepared by grafting and sol&#x2013;gel methods</article-title>. <source>J. Electron Spectrosc. Relat. Phenom.</source> <volume>156-158</volume>, <fpage>413</fpage>&#x2013;<lpage>420</lpage>. <pub-id pub-id-type="doi">10.1016/j.elspec.2006.12.053</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Calais</surname>
<given-names>J.-L.</given-names>
</name>
</person-group> (<year>1993</year>). <article-title>Density-functional theory of atoms and molecules. R.G. Parr and W. Yang, oxford university press, New York, oxford, 1989. IX &#x2b; 333 pp. Price &#xa3;45.00</article-title>. <source>Int. J. Quantum Chem.</source> <volume>47</volume> (<issue>1</issue>), <fpage>101</fpage>. <pub-id pub-id-type="doi">10.1002/qua.560470107</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Clark</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Cramer</surname>
<given-names>R. D.</given-names>
<suffix>Iii</suffix>
</name>
<name>
<surname>Van Opdenbosch</surname>
<given-names>N.</given-names>
</name>
</person-group> (<year>1989</year>). <article-title>Validation of the general purpose tripos 5.2 force field</article-title>. <source>J. Comput. Chem.</source> <volume>10</volume> (<issue>8</issue>), <fpage>982</fpage>&#x2013;<lpage>1012</lpage>. <pub-id pub-id-type="doi">10.1002/jcc.540100804</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Eldridge</surname>
<given-names>M. D.</given-names>
</name>
<name>
<surname>Murray</surname>
<given-names>C. W.</given-names>
</name>
<name>
<surname>Auton</surname>
<given-names>T. R.</given-names>
</name>
<name>
<surname>Paolini</surname>
<given-names>G. V.</given-names>
</name>
<name>
<surname>Mee</surname>
<given-names>R. P.</given-names>
</name>
</person-group> (<year>1997</year>). <article-title>Empirical scoring functions: I. The development of a fast empirical scoring function to estimate the binding affinity of ligands in receptor complexes</article-title>. <source>J. Comput. Aided. Mol. Des.</source> <volume>11</volume> (<issue>5</issue>), <fpage>425</fpage>&#x2013;<lpage>445</lpage>. <pub-id pub-id-type="doi">10.1023/a:1007996124545</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fang</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Zhu</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Numerical simulation of closed plastic impeller molding process and its parameter optimization</article-title>. <source>Sci. Rep.</source> <volume>12</volume> (<issue>1</issue>), <fpage>17335</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-022-22260-7</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Frisch</surname>
<given-names>M. J.</given-names>
</name>
<name>
<surname>Pople</surname>
<given-names>J. A.</given-names>
</name>
<name>
<surname>Binkley</surname>
<given-names>J. S.</given-names>
</name>
</person-group> (<year>1984</year>). <article-title>Self&#x2010;consistent molecular orbital methods 25. Supplementary functions for Gaussian basis sets</article-title>. <source>J. Chem. Phys.</source> <volume>80</volume> (<issue>7</issue>), <fpage>3265</fpage>&#x2013;<lpage>3269</lpage>. <pub-id pub-id-type="doi">10.1063/1.447079</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fu</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Han</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Hou</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Dun</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Gong</surname>
<given-names>X.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Design, synthesis and biological evaluation of saccharin-based N-hydroxybenzamides as histone deacetylases (HDACs) inhibitors</article-title>. <source>Bioorg. Med. Chem.</source> <volume>23</volume> (<issue>17</issue>), <fpage>5774</fpage>&#x2013;<lpage>5781</lpage>. <pub-id pub-id-type="doi">10.1016/j.bmc.2015.07.008</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ganesh</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Poorna Basuri</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Sahini</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Nalini</surname>
<given-names>C. N.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Retention behaviour of analytes in reversed-phase high-performance liquid chromatography-A review</article-title>. <source>Biomed. Chromatogr.</source>, <fpage>e5482</fpage>. <pub-id pub-id-type="doi">10.1002/bmc.5482</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gilson</surname>
<given-names>M. K.</given-names>
</name>
<name>
<surname>Rashin</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Fine</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Honig</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>1985</year>). <article-title>On the calculation of electrostatic interactions in proteins</article-title>. <source>J. Mol. Biol.</source> <volume>184</volume> (<issue>3</issue>), <fpage>503</fpage>&#x2013;<lpage>516</lpage>. <pub-id pub-id-type="doi">10.1016/0022-2836(85)90297-9</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ho</surname>
<given-names>T. C. S.</given-names>
</name>
<name>
<surname>Chan</surname>
<given-names>A. H. Y.</given-names>
</name>
<name>
<surname>Ganesan</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Thirty years of HDAC inhibitors: 2020 insight and hindsight</article-title>. <source>J. Med. Chem.</source> <volume>63</volume> (<issue>21</issue>), <fpage>12460</fpage>&#x2013;<lpage>12484</lpage>. <pub-id pub-id-type="doi">10.1021/acs.jmedchem.0c00830</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jain</surname>
<given-names>A. N.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>Surflex-Dock 2.1: Robust performance from ligand energetic modeling, ring flexibility, and knowledge-based search</article-title>. <source>J. Comput. Aided. Mol. Des.</source> <volume>21</volume> (<issue>5</issue>), <fpage>281</fpage>&#x2013;<lpage>306</lpage>. <pub-id pub-id-type="doi">10.1007/s10822-007-9114-2</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jones</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Willett</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Glen</surname>
<given-names>R. C.</given-names>
</name>
<name>
<surname>Leach</surname>
<given-names>A. R.</given-names>
</name>
<name>
<surname>Taylor</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>1997</year>). <article-title>Development and validation of a genetic algorithm for flexible docking 1 1Edited by F. E. Cohen</article-title>. <source>J. Mol. Biol.</source> <volume>267</volume> (<issue>3</issue>), <fpage>727</fpage>&#x2013;<lpage>748</lpage>. <pub-id pub-id-type="doi">10.1006/jmbi.1996.0897</pub-id>
</citation>
</ref>
<ref id="B18">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Koch</surname>
<given-names>W. H.</given-names>
</name>
<name>
<surname>Holthausen</surname>
<given-names>M. C.</given-names>
</name>
</person-group> (<year>2001</year>). <source>A chemist&#x27;s guide to density functional theory</source>. <edition>second ed.</edition> <publisher-loc>Weinheim, Germany</publisher-loc>: <publisher-name>Wiley VCH</publisher-name>.</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kuntz</surname>
<given-names>I. D.</given-names>
</name>
<name>
<surname>Blaney</surname>
<given-names>J. M.</given-names>
</name>
<name>
<surname>Oatley</surname>
<given-names>S. J.</given-names>
</name>
<name>
<surname>Langridge</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Ferrin</surname>
<given-names>T. E.</given-names>
</name>
</person-group> (<year>1982</year>). <article-title>A geometric approach to macromolecule-ligand interactions</article-title>. <source>J. Mol. Biol.</source> <volume>161</volume> (<issue>2</issue>), <fpage>269</fpage>&#x2013;<lpage>288</lpage>. <pub-id pub-id-type="doi">10.1016/0022-2836(82)90153-x</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ledesma</surname>
<given-names>E. B.</given-names>
</name>
<name>
<surname>Wornat</surname>
<given-names>M. J.</given-names>
</name>
</person-group> (<year>2000</year>). <article-title>QSRR prediction of chromatographic retention of ethynyl-substituted PAH from semiempirically computed solute descriptors</article-title>. <source>Anal. Chem.</source> <volume>72</volume> (<issue>21</issue>), <fpage>5437</fpage>&#x2013;<lpage>5443</lpage>. <pub-id pub-id-type="doi">10.1021/ac000296r</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lee</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Parr</surname>
<given-names>R. G.</given-names>
</name>
</person-group> (<year>1988</year>). <article-title>Development of the Colle-Salvetti correlation-energy formula into a functional of the electron density</article-title>. <source>Phys. Rev. B</source> <volume>37</volume> (<issue>2</issue>), <fpage>785</fpage>&#x2013;<lpage>789</lpage>. <pub-id pub-id-type="doi">10.1103/physrevb.37.785</pub-id>
</citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Cheng</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Tong</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>X.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Forecasting of bioaerosol concentration by a Back Propagation neural network model</article-title>. <source>Sci. Total Environ.</source> <volume>698</volume>, <fpage>134315</fpage>. <pub-id pub-id-type="doi">10.1016/j.scitotenv.2019.134315</pub-id>
</citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liang</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Gao</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Tan</surname>
<given-names>S.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>The mechanism research on the anti-liver fibrosis of emodin based on network pharmacology</article-title>. <source>IUBMB Life</source> <volume>73</volume> (<issue>9</issue>), <fpage>1166</fpage>&#x2013;<lpage>1179</lpage>. <pub-id pub-id-type="doi">10.1002/iub.2523</pub-id>
</citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Tang</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Fang</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Design and synthesis of a new generation of substituted purine hydroxamate analogs as histone deacetylase inhibitors</article-title>. <source>Bioorg. Med. Chem.</source> <volume>24</volume> (<issue>7</issue>), <fpage>1446</fpage>&#x2013;<lpage>1454</lpage>. <pub-id pub-id-type="doi">10.1016/j.bmc.2016.02.005</pub-id>
</citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Luo</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wei</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>X.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Excited states and photodebromination of selected polybrominated diphenyl ethers: Computational and quantitative structure--property relationship studies</article-title>. <source>Int. J. Mol. Sci.</source> <volume>16</volume> (<issue>1</issue>), <fpage>1160</fpage>&#x2013;<lpage>1178</lpage>. <pub-id pub-id-type="doi">10.3390/ijms16011160</pub-id>
</citation>
</ref>
<ref id="B26">
<citation citation-type="book">
<collab>Matlab</collab> (<year>2013</year>). <source>Matlab</source>. <publisher-loc>Natick, MA, USA</publisher-loc>: <publisher-name>The Mathworks Inc.</publisher-name>
</citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mirrahimi</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Salahinejad</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Ghasemi</surname>
<given-names>J. B.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>QSPR approaches to elucidate the stability constants between &#x3b2;-cyclodextrin and some organic compounds: Docking based 3D conformer</article-title>. <source>J. Mol. Liq.</source> <volume>219</volume>, <fpage>1036</fpage>&#x2013;<lpage>1043</lpage>. <pub-id pub-id-type="doi">10.1016/j.molliq.2016.04.037</pub-id>
</citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Motoc</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Dammkoehler</surname>
<given-names>R. A.</given-names>
</name>
<name>
<surname>Mayer</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Labanowski</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>1986</year>). <article-title>Three&#x2010;Dimensional quantitative structure&#x2010;activity relationships I. General approach to the pharmacophore model validation</article-title>. <source>Quant. Struct. -Act. Relat.</source> <volume>5</volume>, <fpage>99</fpage>&#x2013;<lpage>105</lpage>. <pub-id pub-id-type="doi">10.1002/qsar.19860050305</pub-id>
</citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Muegge</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Martin</surname>
<given-names>Y. C.</given-names>
</name>
</person-group> (<year>1999</year>). <article-title>A general and fast scoring function for protein-ligand interactions: A simplified potential approach</article-title>. <source>J. Med. Chem.</source> <volume>42</volume> (<issue>5</issue>), <fpage>791</fpage>&#x2013;<lpage>804</lpage>. <pub-id pub-id-type="doi">10.1021/jm980536j</pub-id>
</citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pan</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Z.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>Quantitative structure-property relationship studies for predicting flash points of alkanes using group bond contribution method with back-propagation neural network</article-title>. <source>J. Hazard. Mat.</source> <volume>147</volume> (<issue>1-2</issue>), <fpage>424</fpage>&#x2013;<lpage>430</lpage>. <pub-id pub-id-type="doi">10.1016/j.jhazmat.2007.01.025</pub-id>
</citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Prasad</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Raut</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Goel</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Barnwal</surname>
<given-names>R. P.</given-names>
</name>
<name>
<surname>Bodhe</surname>
<given-names>G. L.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Electronic nose and wireless sensor network for environmental monitoring application in pulp and paper industry: A review</article-title>. <source>Environ. Monit. Assess.</source> <volume>194</volume> (<issue>12</issue>), <fpage>855</fpage>. <pub-id pub-id-type="doi">10.1007/s10661-022-10479-w</pub-id>
</citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Purohit</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Saini</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Kumar</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Kumar</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Narasimhan</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Three-dimensional quantitative structure-activity relationship (3DQSAR) and molecular docking study of 2-((pyridin-3-yloxy)methyl) piperazines as &#x3b1;7 nicotinic acetylcholine receptor modulators for the treatment of inflammatory disorders</article-title>. <source>Mini Rev. Med. Chem.</source> <volume>20</volume> (<issue>11</issue>), <fpage>1031</fpage>&#x2013;<lpage>1041</lpage>. <pub-id pub-id-type="doi">10.2174/1389557519666190904151227</pub-id>
</citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Raja</surname>
<given-names>M. A. Z.</given-names>
</name>
<name>
<surname>Sabati</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Parveen</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Awais</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Awan</surname>
<given-names>S. E.</given-names>
</name>
<name>
<surname>Chaudhary</surname>
<given-names>N. I.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Integrated intelligent computing application for effectiveness of Au nanoparticles coated over MWCNTs with velocity slip in curved channel peristaltic flow</article-title>. <source>Sci. Rep.</source> <volume>11</volume> (<issue>1</issue>), <fpage>22550</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-021-98490-y</pub-id>
</citation>
</ref>
<ref id="B34">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Reed</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Marks</surname>
<given-names>R. J.</given-names>
</name>
</person-group> (<year>1999</year>). <source>Neural smithing</source>. <publisher-loc>Cambridge, MA</publisher-loc>: <publisher-name>MIT Press</publisher-name>.</citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Roberto Todeschini</surname>
<given-names>V. C.</given-names>
</name>
<name>
<surname>Consonni</surname>
<given-names>V.</given-names>
</name>
</person-group> (<year>2000</year>). <article-title>Handbook of molecular descriptors</article-title>. <source>Methods Princ. Med. Chem.</source> <pub-id pub-id-type="doi">10.1002/9783527613106</pub-id>
</citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Roman</surname>
<given-names>K.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>QSRR quantitative structure-(chromatographic) retention relationships</article-title>. <source>Chem. Rev.</source> <volume>107</volume>, <fpage>3212</fpage>&#x2013;<lpage>3246</lpage>. <pub-id pub-id-type="doi">10.1021/cr068412z</pub-id>
</citation>
</ref>
<ref id="B37">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Roy</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Arnbure</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>The "double cross-validation" software tool for MLR QSAR model development</article-title>. <source>Chemom. Intelligent Laboratory Syst.</source> <volume>159</volume>, <fpage>108</fpage>&#x2013;<lpage>126</lpage>. <pub-id pub-id-type="doi">10.1016/j.chemolab.2016.10.009</pub-id>
</citation>
</ref>
<ref id="B38">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Roy</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Kar</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Ambure</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>On a simple approach for determining applicability domain of QSAR models</article-title>. <source>Chemom. Intelligent Laboratory Syst.</source> <volume>145</volume>, <fpage>22</fpage>&#x2013;<lpage>29</lpage>. <pub-id pub-id-type="doi">10.1016/j.chemolab.2015.04.013</pub-id>
</citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sakr</surname>
<given-names>M. A. S.</given-names>
</name>
<name>
<surname>Sherbiny</surname>
<given-names>F. F.</given-names>
</name>
<name>
<surname>El-Etrawy</surname>
<given-names>A. S.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>Hydrazone-based materials; DFT, TD-DFT, NBO analysis, fukui function, MESP analysis, and solar cell applications</article-title>. <source>J. Fluoresc.</source> <volume>32</volume> (<issue>5</issue>), <fpage>1857</fpage>&#x2013;<lpage>1871</lpage>. <pub-id pub-id-type="doi">10.1007/s10895-022-03000-6</pub-id>
</citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sanyal</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Amin</surname>
<given-names>S. A.</given-names>
</name>
<name>
<surname>Banerjee</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Gayen</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Jha</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>A review of MMP-2 structures and binding mode analysis of its inhibitors to strategize structure-based drug design</article-title>. <source>Bioorg. Med. Chem.</source> <volume>74</volume>, <fpage>117044</fpage>. <pub-id pub-id-type="doi">10.1016/j.bmc.2022.117044</pub-id>
</citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Schaal</surname>
<given-names>J. B.</given-names>
</name>
<name>
<surname>Maretzky</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Tran</surname>
<given-names>D. Q.</given-names>
</name>
<name>
<surname>Tran</surname>
<given-names>P. A.</given-names>
</name>
<name>
<surname>Tongaonkar</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Blobel</surname>
<given-names>C. P.</given-names>
</name>
<etal/>
</person-group> (<year>2018</year>). <article-title>Macrocyclic &#x3b8;-defensins suppress tumor necrosis factor-&#x3b1; (TNF-&#x3b1;) shedding by inhibition of TNF-&#x3b1;-converting enzyme</article-title>. <source>J. Biol. Chem.</source> <volume>293</volume> (<issue>8</issue>), <fpage>2725</fpage>&#x2013;<lpage>2734</lpage>. <pub-id pub-id-type="doi">10.1074/jbc.ra117.000793</pub-id>
</citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Sharp</surname>
<given-names>K. A.</given-names>
</name>
<name>
<surname>Honig</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>1990</year>). <article-title>Electrostatic interactions in macromolecules: Theory and applications</article-title>. <source>Annu. Rev. Biophys. Biophys. Chem.</source> <volume>19</volume>, <fpage>301</fpage>&#x2013;<lpage>332</lpage>. <pub-id pub-id-type="doi">10.1146/annurev.bb.19.060190.001505</pub-id>
</citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Singh</surname>
<given-names>R. R.</given-names>
</name>
<name>
<surname>Rajnarayanan</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Aga</surname>
<given-names>D. S.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Binding of iodinated contrast media (ICM) and their transformation products with hormone receptors: Are ICM the new EDCs?</article-title> <source>Sci. Total Environ.</source> <volume>692</volume>, <fpage>32</fpage>&#x2013;<lpage>36</lpage>. <pub-id pub-id-type="doi">10.1016/j.scitotenv.2019.07.159</pub-id>
</citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Stephens</surname>
<given-names>P. J.</given-names>
</name>
<name>
<surname>Devlin</surname>
<given-names>F. J.</given-names>
</name>
<name>
<surname>Chabalowski</surname>
<given-names>C. F.</given-names>
</name>
<name>
<surname>Frisch</surname>
<given-names>M. J.</given-names>
</name>
</person-group> (<year>1994</year>). <article-title>
<italic>Ab-initio</italic> calculation of vibrational absorption and circular-dichroism spectra using density-functional force-fields</article-title>. <source>J. Phys. Chem.</source> <volume>98</volume> (<issue>45</issue>), <fpage>11623</fpage>&#x2013;<lpage>11627</lpage>. <pub-id pub-id-type="doi">10.1021/j100096a001</pub-id>
</citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Stewart</surname>
<given-names>J. J.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Optimization of parameters for semiempirical methods VI: More modifications to the NDDO approximations and re-optimization of parameters</article-title>. <source>J. Mol. Model.</source> <volume>19</volume> (<issue>1</issue>), <fpage>1</fpage>&#x2013;<lpage>32</lpage>. <pub-id pub-id-type="doi">10.1007/s00894-012-1667-x</pub-id>
</citation>
</ref>
<ref id="B46">
<citation citation-type="book">
<collab>SYBYL</collab> (<year>2012</year>). <source>SYBYL&#xae; is available from Tripos Inc., S.L., MO 63144</source>. <publisher-loc>St. Louis, USA</publisher-loc>: <publisher-name>Tripos International</publisher-name>.</citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Tomasi</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Persico</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>1994</year>). <article-title>Molecular interactions in solution: An overview of methods based on continuous distributions of the solvent</article-title>. <source>Chem. Rev.</source> <volume>94</volume> (<issue>7</issue>), <fpage>2027</fpage>&#x2013;<lpage>2094</lpage>. <pub-id pub-id-type="doi">10.1021/cr00031a013</pub-id>
</citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Turner</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Deeth</surname>
<given-names>R. J.</given-names>
</name>
<name>
<surname>Platts</surname>
<given-names>J. A.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Prediction of ligand effects in platinum-amyloid-&#x3b2; coordination</article-title>. <source>J. Inorg. Biochem.</source> <volume>173</volume>, <fpage>44</fpage>&#x2013;<lpage>51</lpage>. <pub-id pub-id-type="doi">10.1016/j.jinorgbio.2017.05.003</pub-id>
</citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Waltho</surname>
<given-names>J. P.</given-names>
</name>
<name>
<surname>Vinter</surname>
<given-names>J. G.</given-names>
</name>
<name>
<surname>Davis</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Williams</surname>
<given-names>D. H.</given-names>
</name>
</person-group> (<year>1988</year>). <article-title>Forces in molecular recognition: Comparison of experimental data and molecular mechanics calculations</article-title>. <source>J. Comput. Aided. Mol. Des.</source> <volume>2</volume> (<issue>1</issue>), <fpage>31</fpage>&#x2013;<lpage>41</lpage>. <pub-id pub-id-type="doi">10.1007/bf01532051</pub-id>
</citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Xiao</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Numerical interpretation of molecular surface field in dielectric modeling of solvation</article-title>. <source>J. Comput. Chem.</source> <volume>38</volume> (<issue>14</issue>), <fpage>1057</fpage>&#x2013;<lpage>1070</lpage>. <pub-id pub-id-type="doi">10.1002/jcc.24782</pub-id>
</citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wang</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Han</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Hou</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Pan</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>Design, synthesis, and preliminary bioactivity studies of substituted purine hydroxamic acid derivatives as novel histone deacetylase (HDAC) inhibitors</article-title>. <source>MedChemComm</source> <volume>5</volume> (<issue>12</issue>), <fpage>1887</fpage>&#x2013;<lpage>1891</lpage>. <pub-id pub-id-type="doi">10.1039/c4md00203b</pub-id>
</citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>White</surname>
<given-names>D. N. J.</given-names>
</name>
</person-group> (<year>1977</year>). <article-title>The principles and practice of molecular mechanics calculations</article-title>. <source>Comput. Chem.</source> <volume>1</volume> (<issue>3</issue>), <fpage>225</fpage>&#x2013;<lpage>233</lpage>. <pub-id pub-id-type="doi">10.1016/0097-8485(77)85014-6</pub-id>
</citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xie</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Xue</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>The prediction of public risk perception by internal characteristics and external environment: Machine learning on big data</article-title>. <source>Int. J. Environ. Res. Public Health</source> <volume>19</volume> (<issue>15</issue>), <fpage>9545</fpage>. <pub-id pub-id-type="doi">10.3390/ijerph19159545</pub-id>
</citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Cai</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>Quantitative structure-activity relationship models for genotoxicity prediction based on combination evaluation strategies for toxicological alternative experiments</article-title>. <source>Sci. Rep.</source> <volume>11</volume> (<issue>1</issue>), <fpage>8030</fpage>. <pub-id pub-id-type="doi">10.1038/s41598-021-87035-y</pub-id>
</citation>
</ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhang</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Dai</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Yao</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Prediction model for the water jet falling point in fire extinguishing based on a GA-BP neural network</article-title>. <source>PLoS One</source> <volume>14</volume> (<issue>9</issue>), <fpage>e0221729</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0221729</pub-id>
</citation>
</ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>&#x17d;uvela</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Liu</surname>
<given-names>J. J.</given-names>
</name>
<name>
<surname>Macur</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Baczek</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Molecular descriptor subset selection in theoretical peptide quantitative structure-retention relationship model development using nature-inspired optimization algorithms</article-title>. <source>Anal. Chem.</source> <volume>87</volume> (<issue>19</issue>), <fpage>9876</fpage>&#x2013;<lpage>9883</lpage>. <pub-id pub-id-type="doi">10.1021/acs.analchem.5b02349</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>