<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Chem.</journal-id>
<journal-title>Frontiers in Chemistry</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Chem.</abbrev-journal-title>
<issn pub-type="epub">2296-2646</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">800370</article-id>
<article-id pub-id-type="doi">10.3389/fchem.2021.800370</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Chemistry</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Design of Organic Electronic Materials With a Goal-Directed Generative Model Powered by Deep Neural Networks and High-Throughput Molecular Simulations</article-title>
<alt-title alt-title-type="left-running-head">Kwak et&#x20;al.</alt-title>
<alt-title alt-title-type="right-running-head">OLED Design by Machine Learning</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Kwak</surname>
<given-names>H. Shaun</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/962263/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>An</surname>
<given-names>Yuling</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Giesen</surname>
<given-names>David J.</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Hughes</surname>
<given-names>Thomas F.</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Brown</surname>
<given-names>Christopher T.</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1568856/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Leswing</surname>
<given-names>Karl</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Abroshan</surname>
<given-names>Hadi</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1528346/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Halls</surname>
<given-names>Mathew D.</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1240112/overview"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Schr&#xf6;dinger, Inc.</institution>, <addr-line>Portland</addr-line>, <addr-line>OR</addr-line>, <country>United&#x20;States</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Schr&#xf6;dinger, Inc.</institution>, <addr-line>New York</addr-line>, <addr-line>NY</addr-line>, <country>United&#x20;States</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Schr&#xf6;dinger, Inc.</institution>, <addr-line>San Diego</addr-line>, <addr-line>CA</addr-line>, <country>United&#x20;States</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/545003/overview">Javier Carrasco</ext-link>, CIC Energigune, Spain</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1558934/overview">Ross Larsen</ext-link>, National Renewable Energy Laboratory (DOE), United&#x20;States</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1562827/overview">Youn-Suk Choi</ext-link>, Samsung Advanced Institute of Technology (SAIT), South Korea</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: H. Shaun Kwak, <email>shaun.kwak@schrodinger.com</email>; Yuling An, <email>yuling.an@schrodinger.com</email>
</corresp>
<fn fn-type="other">
<p>This article was submitted to Physical Chemistry and Chemical Physics, a section of the journal Frontiers in Chemistry</p>
</fn>
</author-notes>
<pub-date pub-type="epub">
<day>17</day>
<month>01</month>
<year>2022</year>
</pub-date>
<pub-date pub-type="collection">
<year>2021</year>
</pub-date>
<volume>9</volume>
<elocation-id>800370</elocation-id>
<history>
<date date-type="received">
<day>23</day>
<month>10</month>
<year>2021</year>
</date>
<date date-type="accepted">
<day>15</day>
<month>12</month>
<year>2021</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2022 Kwak, An, Giesen, Hughes, Brown, Leswing, Abroshan and Halls.</copyright-statement>
<copyright-year>2022</copyright-year>
<copyright-holder>Kwak, An, Giesen, Hughes, Brown, Leswing, Abroshan and Halls</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these&#x20;terms.</p>
</license>
</permissions>
<abstract>
<p>In recent years, generative machine learning approaches have attracted significant attention as an enabling approach for designing novel molecular materials with minimal design bias and thereby realizing more directed design for a specific materials property space. Further, data-driven approaches have emerged as a new tool to accelerate the development of novel organic electronic materials for organic light-emitting diode (OLED) applications. We demonstrate and validate a goal-directed generative machine learning framework based on a recurrent neural network (RNN) deep reinforcement learning approach for the design of hole transporting OLED materials. These large-scale molecular simulations also demonstrate a rapid, cost-effective method to identify new materials in OLEDs while also enabling expansion into many other verticals such as catalyst design, aerospace, life science, and petrochemicals.</p>
</abstract>
<kwd-group>
<kwd>OLED</kwd>
<kwd>recurrent neural network</kwd>
<kwd>generative model</kwd>
<kwd>reinforcement learning</kwd>
<kwd>hole transport</kwd>
<kwd>organic electronics</kwd>
<kwd>molecular simulation</kwd>
</kwd-group>
</article-meta>
</front>
<body>
<sec id="s1">
<title>Introduction</title>
<p>We are in a paradigm-changing era in the way scientists develop new materials. The advent of modern virtual screening techniques has benefited from virtually infinite cloud computing resources and then, when combined with modern machine learning techniques, and has demonstrated extraordinary success (<xref ref-type="bibr" rid="B22">G&#xf3;mez-Bombarelli et&#x20;al., 2016</xref>). In recent years it has become recognized that one could rely on computational chemistry to deliver sufficient accuracy to inform industrial materials research (<xref ref-type="bibr" rid="B73">Yarnell et&#x20;al., 2021</xref>). This new paradigm directly results from the latest advances in the theory and methods of atomic-scale chemical simulation and the expanding computational power described previously.</p>
<p>With the emergence of simulation as a technology driver, improved algorithms for artificial intelligence (machine learning), cloud compute resources, and computational capabilities such as GPUs, TPUs, analog, and purpose-directed (AI/ML) chips (<xref ref-type="bibr" rid="B60">Shalf, 2020</xref>) are advancing the utility of simulation capabilities. As a result of these changes, many organizations are expanding their digital transformation efforts (<xref ref-type="bibr" rid="B11">Cheng et&#x20;al., 2021</xref>) to include more efficient data-driven solutions aimed at a significant speed-up in assessing key control variables for the design and commercialization of novel materials (<xref ref-type="bibr" rid="B26">Himanen et&#x20;al., 2019</xref>). With physics-based simulation tools as the foundation, data science helps researchers minimize costly experimental measurements, and computationally intensive simulations (<xref ref-type="bibr" rid="B43">Meredig et&#x20;al., 2014</xref>; <xref ref-type="bibr" rid="B10">Butler et&#x20;al., 2018</xref>) while enabling the utilization of datasets for a more thorough exploration of a materials space (<xref ref-type="bibr" rid="B52">Raccuglia et&#x20;al., 2016</xref>; <xref ref-type="bibr" rid="B21">Ghiringhelli et&#x20;al., 2017</xref>). With these advantages, there is increased use and need for machine learning methods in conjunction with physics-based simulation for various applications in materials research (<xref ref-type="bibr" rid="B51">Pilania et&#x20;al., 2013</xref>; <xref ref-type="bibr" rid="B6">Bart&#xf3;k et&#x20;al., 2017</xref>; <xref ref-type="bibr" rid="B36">Liu et&#x20;al., 2017</xref>; <xref ref-type="bibr" rid="B69">Wei et&#x20;al., 2019</xref>; <xref ref-type="bibr" rid="B45">Moosavi et&#x20;al., 2020</xref>; <xref ref-type="bibr" rid="B49">Nisbet et&#x20;al., 2020</xref>; <xref ref-type="bibr" rid="B70">Xie et&#x20;al., 2020</xref>).</p>
<p>Despite this great potential, there remain challenges such as data scarcity, quality, and the inherent complexity of the model-building and validation procedures that pose a significant obstacle in a data-driven discovery framework. These obstacles often pose a threat to the effective use of the cheminformatics approaches in chemical discovery. Recently software packages have automated best practices for creating predictive machine learning models over chemical data, applying regularization, and searching over appropriate model architectures (<xref ref-type="bibr" rid="B14">Dixon et&#x20;al., 2016</xref>). These packages have successfully provided life sciences applications&#x2019; value (<xref ref-type="bibr" rid="B1">Abd El-Karim et&#x20;al., 2018</xref>; <xref ref-type="bibr" rid="B13">de Oliveira and Katekawa, 2018</xref>; <xref ref-type="bibr" rid="B46">Murahari et&#x20;al., 2019</xref>; <xref ref-type="bibr" rid="B27">Iwaloye et&#x20;al., 2020</xref>).</p>
<p>The ever-increasing demand for high-performance display technology in consumer electronics drives the design and synthesis of various novel OLED materials, such as charge transporters, hosts, and emitters (<xref ref-type="bibr" rid="B42">Melnyk and Pai, 1990</xref>; <xref ref-type="bibr" rid="B30">Jhulki and Moorthy, 2018</xref>). Optoelectronic properties, such as HOMO, LUMO, hole reorganization energy, and thermal properties, such as glass transition temperature, are key considerations when designing high-performance OLED materials (<xref ref-type="bibr" rid="B9">Buckley, 2013</xref>). Although scientists and engineers have accumulated significant knowledge in synthesizing these materials in the lab over the years, the process of experimentally making and measuring the synthesized structures still requires a considerable amount of effort and&#x20;time.</p>
<p>Atomic-scale simulation has been an essential tool for navigating the enormous chemical space of novel OLED materials (<xref ref-type="bibr" rid="B25">Halls et&#x20;al., 2015</xref>; <xref ref-type="bibr" rid="B24">Halls et&#x20;al., 2016</xref>). With increasing high-throughput computational capabilities, massive theoretical screening of millions of compounds has become a reality (<xref ref-type="bibr" rid="B41">Matsuzawa et&#x20;al., 2020a</xref>). The ready availability of high-quality computational data generated from simulations is proving to be a gold mine for data-driven prediction of material properties, thereby realizing a significant speed-up in assessing key control variables for designing novel materials.</p>
<p>Although there are several ways to generate ideas for new compounds <italic>in silico</italic>, such as exhaustive R-group enumeration, core hopping, and early structure-based <italic>de novo</italic> design algorithms (<xref ref-type="bibr" rid="B25">Halls et&#x20;al., 2015</xref>), they share many common limitations. One of the most prominent is that generated compounds often do not have the desired properties, including activity, operational stability, and many others depending on the application area despite the intended optimization within the chemical design space. Recent successes with recurrent neural networks (RNN) on SMILES representations of molecules generating predicted activities against dopamine receptor Type 2 (<xref ref-type="bibr" rid="B55">Schneider and Fechner, 2005</xref>) have pointed to a new path for molecular <italic>de novo</italic> design targeting specific properties.</p>
<p>In this work, we report a new materials discovery framework powered by the combination of high-throughput quantum chemical simulations and RNN-based generative machine learning techniques designed to explore the chemical space of hole-transporting materials for optimal properties. Successful demonstration of a goal-directed machine learning approach for the case study is realized by uncovering novel materials chemistry satisfying the design criteria.</p>
</sec>
<sec id="s2">
<title>Methods and Principles</title>
<sec id="s2-1">
<title>Goal-Directed Generative Machine Learning</title>
<p>We built a goal-directed generative model using the REINVENT (<xref ref-type="bibr" rid="B50">Olivecrona et&#x20;al., 2017</xref>) protocol, which has shown success in drug discovery applications (<xref ref-type="bibr" rid="B20">Ghanakota et&#x20;al., 2020</xref>) by generating tens of thousands of unique structures with targeted properties while only requiring a few hours of computing time. The deep reinforcement learning methodology applied in the REINVENT protocol is a robust solution for chemical enumeration while not consuming a prohibitive amount of computation cost (<xref ref-type="bibr" rid="B50">Olivecrona et&#x20;al., 2017</xref>; <xref ref-type="bibr" rid="B20">Ghanakota et&#x20;al., 2020</xref>).</p>
<p>The general schematics of the goal-directed generative model in <xref ref-type="fig" rid="F1">Figure&#x20;1</xref> describes a protocol of two individual stages. The first stage trains a prior network from an extensive collection of structures in the chemical space of interest. The second stage shifts the distribution based on a utility function, encoding the desired property ranges. In previous studies, we trained the REINVENT algorithm with a group of structures generated by the PathFinder algorithm (<xref ref-type="bibr" rid="B20">Ghanakota et&#x20;al., 2020</xref>). This work aims to use a design space for REINVENT to cover organic electronics, represented by the popular structural motifs shared among successful hole transport materials.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Schematic representation of the goal-directed generative model for materials discovery.</p>
</caption>
<graphic xlink:href="fchem-09-800370-g001.tif"/>
</fig>
<p>Hole transport materials cannot be successfully designed based on a single design parameter. Most material designs require consideration of multiple parameters that may or may not be coupled to each other by a complicated network of trade-offs. We developed a multiparameter optimization (MPO) scoring function to cope with design principles. Four critical hole transport performance parameters were selected and used to construct the property space, namely two molecular orbital energies (HOMO and LUMO) that define the band offset of the hole transport layer, hole reorganization energy that dictates charge carrier (i.e.,&#x20;hole) mobility, and glass transition temperature (<italic>T</italic>
<sub>
<italic>g</italic>
</sub>) that determines morphological stability. The property space was projected to a single MPO score and used as the utility function for the REINVENT algorithm generating new chemical structures described in <xref ref-type="fig" rid="F1">Figure&#x20;1</xref>.</p>
</sec>
<sec id="s2-2">
<title>Chemistry by Neural Network</title>
<p>As demonstrated in previous drug discovery work (<xref ref-type="bibr" rid="B50">Olivecrona et&#x20;al., 2017</xref>), the prior network provides a mechanism to create new chemical structures powered by a deep neural network. A training set library defines the chemical design space. Still, it is crucial to recognize that one cannot simply reuse a prior network explicitly used for drug design (e.g., ChEMBL database). An entirely new training set that resembles more of the chemical space for a target material must be used, such as the one needed in this&#x20;work.</p>
<p>We collected two groups of chemical structures composed of cores, and R-groups, to assemble the common structural motifs of known hole transport materials for building a prior network. R-groups are defined by the chemical substructures observed frequently on the structural periphery of known hole transport materials, and each is given a single attachment as a connection point to a core. The core and R-group setup can provide an extensive chemical library base through simple structural enumeration while preserving the chemical space of designers&#x2019; interest. The symmetric enumeration scheme also adds the resulting chemical structures with high symmetry, translating into better operational stability and, to a certain degree, and enhanced synthetic viability for the resulting design space (<xref ref-type="bibr" rid="B68">Vor&#x161;il&#xe1;k et&#x20;al., 2020</xref>).</p>
<p>We manually selected thirty-eight unique cores (<xref ref-type="fig" rid="F2">Figure&#x20;2</xref>) from frequently appearing fragments in known hole transport materials published in commercial catalogs and literature (<xref ref-type="bibr" rid="B59">Shahnawaz et&#x20;al., 2019</xref>). We enumerated the structural R-groups with a genetic algorithm featured in the Materials Science Suite as a goal-directed chemical design solution (<xref ref-type="bibr" rid="B57">Schr&#xf6;dinger, 2021</xref>; <xref ref-type="bibr" rid="B28">Jennings et&#x20;al., 2019</xref>), starting from a group of similarly found fragments reported in the hole transport materials literature. The same genetic optimization tool implemented in this work has already found utility for designing new molecular materials for battery technology (<xref ref-type="bibr" rid="B47">Murdock et&#x20;al., 2015</xref>). We used the genetic algorithm as a library generation tool without explicit goals to generate 53,808 unique R-groups defined in the organic electronics space. The unique R-group set used in this work to build the training set for the prior network is available from files provided with the supporting information.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>Thirty-eight unique core structures curated from a known group of hole transport materials as the basis of the training set for building a prior network. Attachment points for R-group enumeration are marked with I.</p>
</caption>
<graphic xlink:href="fchem-09-800370-g002.tif"/>
</fig>
<p>The Materials Science Suite (<xref ref-type="bibr" rid="B57">Schr&#xf6;dinger, 2021</xref>) enumerated R-groups based on the core and R-group libraries. The structural enumeration steps provide symmetrically equivalent groups of substitution points that will always get the same R-group, while each of the R-groups can be substituted independently. Based on the principles of structural enumeration, over 2 million structures were generated and used for training the prior network.</p>
</sec>
<sec id="s2-3">
<title>High-Throughput Quantum Chemistry</title>
<p>Once a prior network defines the chemical design space, the next step is to build a training set for the scorer network of the generative model. The role of the scorer network is to provide the context of structure-property relationships to the model, so the machine can accurately differentiate useful chemistry from less-useful chemistry. Training the scorer network requires a property space paired with the chemical space. This building process is similar to a conventional quantitative structure-property relationships (QSPR) model. It is difficult to find or generate a large amount of reliable data, and consequently, this data scarcity is a challenge when building an accurate machine learning&#x20;model.</p>
<p>One of the emerging trends in overcoming the data scarcity problem in chemical machine learning models is to utilize physics-based theoretical predictions of the material&#x2019;s properties as a virtual training set. These simulations are now possible because of recent improvements in predictive accuracy and that one can cost-effectively access such predictions at a large scale. A recent example of organic semiconductor design (<xref ref-type="bibr" rid="B40">Matsuzawa et&#x20;al., 2020b</xref>) demonstrates how the state-of-the-art physics-based simulation technology powered by a large-scale computing environment accessible to the scientific community can be utilized to produce a large number of reliable materials databases for the development of new materials. The automated large-scale quantum chemical and machine learning predictive schemes used in work are designed to utilize a similar strategy in developing new organic electronic materials.</p>
<p>Using a diversity selection method (<xref ref-type="bibr" rid="B4">An et&#x20;al., 2012</xref>) featured in Schr&#xf6;dinger&#x2019;s MS Informatics package, 265 representative structures were selected from each of the 38 cores, resulting in a total of 10,070 structures. We ran geometry optimization of all 10,070 structures with the same parameters to calculate orbital and reorganization energies. Any compounds that have failed to produce a converged low-energy geometry were removed from the list, leaving 8,627 compounds to be selected and used as the training set for the scorer model. The Materials Science Suite optoelectronics workflow module was used to compute orbital energies (for HOMO and LUMO) and hole reorganization energies of the training set compounds. The raw orbital energies computed from density functional calculations are rarely comparable to the ones obtained from the experiment. This is because the experimental orbital energies are often derived from measured redox potentials using the following expressions to assess the difference between the electrode energy and the redox potentials:<disp-formula id="e1">
<mml:math id="m1">
<mml:mrow>
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mrow>
<mml:mtext>Abs</mml:mtext>
<mml:mtext>.&#xa0;Electrode</mml:mtext>
</mml:mrow>
</mml:msub>
<mml:msub>
<mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mtext>&#xa0;E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mtext>NHE</mml:mtext>
</mml:mrow>
</mml:msub>
<mml:mtext>&#xa0;</mml:mtext>
<mml:mo>&#x2b;</mml:mo>
<mml:mtext>&#xa0;</mml:mtext>
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mrow>
<mml:mtext>Electrode</mml:mtext>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
<label>(1)</label>
</disp-formula>
<disp-formula id="e2">
<mml:math id="m2">
<mml:mrow>
<mml:msub>
<mml:mtext>E</mml:mtext>
<mml:mrow>
<mml:mtext>HOMO/LUMO</mml:mtext>
</mml:mrow>
</mml:msub>
<mml:mtext>&#xa0;</mml:mtext>
<mml:mo>&#x3d;</mml:mo>
<mml:mtext>&#xa0;</mml:mtext>
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mrow>
<mml:mtext>Abs</mml:mtext>
<mml:mtext>.&#xa0;Electrode</mml:mtext>
</mml:mrow>
</mml:msub>
<mml:mo>-</mml:mo>
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mrow>
<mml:mtext>Oxidation/Reduction</mml:mtext>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:math>
<label>(2)</label>
</disp-formula>
</p>
<p>Shukla and coworkers (<xref ref-type="bibr" rid="B64">Shukla et&#x20;al., 2009</xref>) and Kondakova and coworkers (<xref ref-type="bibr" rid="B32">Kondakova et&#x20;al., 2008</xref>) suggested that a relatively inexpensive level of theory and basis set (B3LYP/MIDI!) combined with empirical corrections from molecular density functional calculations can generate the orbital energies (Koopman redox potentials) that are more comparable to the experimental measurements. We apply the empirical corrections to produce the Koopman redox potentials from the raw density functional orbital energies as follows:<disp-formula id="e3">
<mml:math id="m3">
<mml:mrow>
<mml:msub>
<mml:mtext>V</mml:mtext>
<mml:mrow>
<mml:mtext>Oxidation</mml:mtext>
</mml:mrow>
</mml:msub>
<mml:mtext>&#xa0;</mml:mtext>
<mml:mo>&#x3d;</mml:mo>
<mml:mtext>&#xa0;</mml:mtext>
<mml:mo>-</mml:mo>
<mml:mn>17</mml:mn>
<mml:mtext>.</mml:mtext>
<mml:mn>50</mml:mn>
<mml:mo>&#x22c5;</mml:mo>
<mml:msub>
<mml:mtext mathvariant="italic">E</mml:mtext>
<mml:mrow>
<mml:mtext>HOMO,&#xa0;DFT</mml:mtext>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mtext>eV</mml:mtext>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>-</mml:mo>
<mml:mn>2</mml:mn>
<mml:mtext>.</mml:mtext>
<mml:mn>17</mml:mn>
</mml:mrow>
</mml:math>
<label>(3)</label>
</disp-formula>
<disp-formula id="e4">
<mml:math id="m4">
<mml:mrow>
<mml:msub>
<mml:mi>V</mml:mi>
<mml:mrow>
<mml:mtext>Reduction</mml:mtext>
</mml:mrow>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mtext>&#xa0;</mml:mtext>
<mml:mo>-</mml:mo>
<mml:mn>22</mml:mn>
<mml:mtext>.</mml:mtext>
<mml:mn>50</mml:mn>
<mml:mo>&#x22c5;</mml:mo>
<mml:msub>
<mml:mi>E</mml:mi>
<mml:mrow>
<mml:mtext>LUMO,&#xa0;DFT</mml:mtext>
</mml:mrow>
</mml:msub>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mtext>eV</mml:mtext>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>-</mml:mo>
<mml:mtext>&#xa0;</mml:mtext>
<mml:mn>3</mml:mn>
<mml:mtext>.</mml:mtext>
<mml:mn>21</mml:mn>
</mml:mrow>
</mml:math>
<label>(4)</label>
</disp-formula>
</p>
<p>These redox potentials are then entered into <xref ref-type="disp-formula" rid="e1">Eqs 1</xref>, <xref ref-type="disp-formula" rid="e2">2</xref> to produce the orbital energy predictions. <italic>E</italic>
<sub>NHE</sub> is the energy of the NHE electrode in water, taken to be &#x2212;4.28&#xa0;V (<xref ref-type="bibr" rid="B67">Truhlar et&#x20;al., 2004</xref>; <xref ref-type="bibr" rid="B32">Kondakova et&#x20;al., 2008</xref>), and <italic>V</italic>
<sub>Electrode</sub> is the potential of the chosen electrode relative to NHE. We used the V<sub>Electrode</sub> of 0.25&#xa0;V in this work, which is the potential relative to the saturated calomel electrode (SCE). This results in the absolute electrode potential (V<sub>Abs. Electrode</sub>) of &#x2212;4.53&#xa0;V. Hole reorganization energies were computed using the following equation:<disp-formula id="e5">
<mml:math id="m5">
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext>&#x3bb;&#xa0;</mml:mtext>
</mml:mrow>
<mml:mi>h</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi>E</mml:mi>
<mml:msubsup>
<mml:mo>&#xa0;</mml:mo>
<mml:mrow>
<mml:mo>&#xa0;</mml:mo>
<mml:mi mathvariant="normal">r</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mi mathvariant="normal">l</mml:mi>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mi mathvariant="normal">d</mml:mi>
<mml:mo>&#xa0;</mml:mo>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mo>&#xa0;</mml:mo>
<mml:mi mathvariant="normal">c</mml:mi>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
<mml:mi mathvariant="normal">o</mml:mi>
<mml:mi mathvariant="normal">n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">n</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mi mathvariant="normal">u</mml:mi>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mi mathvariant="normal">r</mml:mi>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:mi mathvariant="normal">l</mml:mi>
</mml:mrow>
</mml:msubsup>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>E</mml:mi>
<mml:msubsup>
<mml:mo>&#xa0;</mml:mo>
<mml:mrow>
<mml:mo>&#xa0;</mml:mo>
<mml:mi mathvariant="normal">r</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mi mathvariant="normal">l</mml:mi>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mi mathvariant="normal">d</mml:mi>
<mml:mo>&#xa0;</mml:mo>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mo>&#xa0;</mml:mo>
<mml:mi mathvariant="normal">n</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mi mathvariant="normal">u</mml:mi>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mi mathvariant="normal">r</mml:mi>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:mi mathvariant="normal">l</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">n</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mi mathvariant="normal">u</mml:mi>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mi mathvariant="normal">r</mml:mi>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:mi mathvariant="normal">l</mml:mi>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x2b;</mml:mo>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi>E</mml:mi>
<mml:msubsup>
<mml:mo>&#xa0;</mml:mo>
<mml:mrow>
<mml:mo>&#xa0;</mml:mo>
<mml:mi mathvariant="normal">r</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mi mathvariant="normal">l</mml:mi>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mi mathvariant="normal">d</mml:mi>
<mml:mo>&#xa0;</mml:mo>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mo>&#xa0;</mml:mo>
<mml:mi mathvariant="normal">n</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mi mathvariant="normal">u</mml:mi>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mi mathvariant="normal">r</mml:mi>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:mi mathvariant="normal">l</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">c</mml:mi>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
<mml:mi mathvariant="normal">o</mml:mi>
<mml:mi mathvariant="normal">n</mml:mi>
</mml:mrow>
</mml:msubsup>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>E</mml:mi>
<mml:msubsup>
<mml:mo>&#xa0;</mml:mo>
<mml:mrow>
<mml:mo>&#xa0;</mml:mo>
<mml:mi mathvariant="normal">r</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mi mathvariant="normal">l</mml:mi>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:mi mathvariant="normal">x</mml:mi>
<mml:mi mathvariant="normal">e</mml:mi>
<mml:mi mathvariant="normal">d</mml:mi>
<mml:mo>&#xa0;</mml:mo>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mo>&#xa0;</mml:mo>
<mml:mi mathvariant="normal">c</mml:mi>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
<mml:mi mathvariant="normal">o</mml:mi>
<mml:mi mathvariant="normal">n</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="normal">c</mml:mi>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
<mml:mi mathvariant="normal">o</mml:mi>
<mml:mi mathvariant="normal">n</mml:mi>
</mml:mrow>
</mml:msubsup>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
<label>(5)</label>
</disp-formula>
</p>
<p>The reorganization calculations were performed at the same level of theory without further empirical corrections, which provides accurate predictions in the hole transport materials space based on a previous study (<xref ref-type="bibr" rid="B17">Evans et&#x20;al., 2016</xref>).</p>
<p>Owing to the computational cost of predicting glass transition temperatures (<italic>T</italic>
<sub>
<italic>g</italic>
</sub>) using physics-based simulations (<xref ref-type="bibr" rid="B2">Afzal et&#x20;al., 2021</xref>), we opted to use a QSPR model instead. The QSPR model was trained to predict <italic>T</italic>
<sub>
<italic>g</italic>
</sub> based on 250 known OLED materials from the literature (<xref ref-type="bibr" rid="B48">Naito and Miura, 1993</xref>; <xref ref-type="bibr" rid="B18">Fujikawa et&#x20;al., 2000</xref>; <xref ref-type="bibr" rid="B63">Shirota, 2000</xref>; <xref ref-type="bibr" rid="B74">Yin et&#x20;al., 2003</xref>; <xref ref-type="bibr" rid="B31">Kimura et&#x20;al., 2005</xref>; <xref ref-type="bibr" rid="B71">Xu and Chen, 2005</xref>; <xref ref-type="bibr" rid="B19">Gao et&#x20;al., 2007</xref>; <xref ref-type="bibr" rid="B62">Shirota and Kageyama, 2007</xref>). A Kernel-based Partial Least Squares (KPLS) method (<xref ref-type="bibr" rid="B5">An et&#x20;al., 2013</xref>) was used to build a predictive model that results in an R<sup>2</sup> for the training set compounds of 0.87 and that for the test set compounds of 0.86. A training-set to a test-set ratio of 4:1 was used to assess the model&#x2019;s accuracy to unknown chemistry. <xref ref-type="fig" rid="F3">Figure&#x20;3</xref> shows the comparison between the QSPR predicted and experimentally measured <italic>T</italic>
<sub>
<italic>g</italic>
</sub> of the 250 OLED compounds used to build the QSPR prediction&#x20;model.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>QSPR model predictions vs experiment for the glass transition temperature (T<sub>g</sub>) of the 250 OLED compounds used to build the T<sub>g</sub> prediction model. Filled squares represent the training set data, and empty squares represent the test set&#x20;data.</p>
</caption>
<graphic xlink:href="fchem-09-800370-g003.tif"/>
</fig>
</sec>
<sec id="s2-4">
<title>Multiparameter Optimization</title>
<p>Multiparameter optimization, often referred to as MPO, provides a measure to assess the logistic transformation function for each constituent property. The MPO scheme used in this work translates each property data to a dimensionless scale between 0 and 1. The MPO scores are set up so that the compound would score below 0.2 if it is bad, between 0.2 and 0.8 if it is ok, and above 0.8 if it is good, and based on the user-specified criteria. The MPO score itself is continuous as defined by the curve for any given set of properties that consist of the multiparameter space. The first step to convert a set of individual properties into a single MPO score is to normalize each individual property into a dimensionless score that ranges from zero to one. We define this normalized score as the desirability score. Conversion from the individual properties to the desirability score is done using a logistic function, whose shape can be further tuned by defining fixed boundaries between bad and good values. In each property space, we define a specific logistic function f(<italic>x</italic>) for the property <italic>x</italic>. This is done by constraining the value of f(<italic>x</italic>) as 0.2 at the boundary between ok and bad values for <italic>x</italic>, and as 0.8 at the boundary between good and ok values for <italic>x</italic>. These points correspond to the inflection points on the logistic function curve, as shown in <xref ref-type="fig" rid="F4">Figure&#x20;4</xref>. With these constraints, one can solve the logistic function written as below for a and b for each property space:<disp-formula id="e6">
<mml:math id="m6">
<mml:mrow>
<mml:mi>f</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mi>x</mml:mi>
<mml:mo>)</mml:mo>
</mml:mrow>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mrow>
<mml:mn>1</mml:mn>
<mml:mo>&#x2b;</mml:mo>
<mml:msup>
<mml:mi>e</mml:mi>
<mml:mrow>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>b</mml:mi>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mi>x</mml:mi>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>a</mml:mi>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:msup>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
<label>(6)</label>
</disp-formula>
</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Desirability score setups for the multiparameter optimization scoring of hole transport materials. HOMO energy (upper left) is set up with the &#x201c;middle good&#x201d; mode, hole reorganization energy (lower left) is set up with the &#x201c;lower better&#x201d; mode, and both LUMO energy (upper right) and glass transition temperature (lower right) are set with the &#x201c;higher the better&#x201d;&#x20;mode.</p>
</caption>
<graphic xlink:href="fchem-09-800370-g004.tif"/>
</fig>
<p>If the property needs to be maximized (identified as a &#x201c;higher better&#x201d; mode with b &#x3e; 0) or to be minimized (identified as a &#x201c;lower better&#x201d; mode with b &#x3c; 0), a single logistic function can be used to set up the desirability score per property space. If the target property is sandwiched between the less-desired property domains (identified as a &#x201c;middle good&#x201d; mode), we break down the property space into two spaces and solve for the two logistic functions&#x2014;&#x201c;higher better&#x201d; mode on the left and &#x201c;lower better&#x201d; mode on the right&#x2014;that are facing each other in line symmetry at the target property. Once the logistic function f(<italic>x</italic>) is solved for each property space, f(<italic>x</italic>) becomes the desirability score for a compound that has the property <italic>x</italic>. The MPO score is then generated by taking the geometric mean of the desirability scores.<disp-formula id="e7">
<mml:math id="m7">
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mrow>
<mml:mo>(</mml:mo>
<mml:mrow>
<mml:mo>&#xa0;</mml:mo>
<mml:munderover>
<mml:mstyle displaystyle="true">
<mml:mo>&#x220f;</mml:mo>
</mml:mstyle>
<mml:mrow>
<mml:mi>i</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:munderover>
<mml:msub>
<mml:mi>a</mml:mi>
<mml:mi>i</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mo>)</mml:mo>
</mml:mrow>
</mml:mrow>
<mml:mrow>
<mml:mfrac>
<mml:mn>1</mml:mn>
<mml:mi>n</mml:mi>
</mml:mfrac>
</mml:mrow>
</mml:msup>
<mml:mo>&#x3d;</mml:mo>
<mml:mroot>
<mml:mrow>
<mml:msub>
<mml:mi>a</mml:mi>
<mml:mn>1</mml:mn>
</mml:msub>
<mml:mo>&#x22c5;</mml:mo>
<mml:msub>
<mml:mi>a</mml:mi>
<mml:mn>2</mml:mn>
</mml:msub>
<mml:mo>&#x22ef;</mml:mo>
<mml:msub>
<mml:mi>a</mml:mi>
<mml:mi>n</mml:mi>
</mml:msub>
</mml:mrow>
<mml:mi>n</mml:mi>
</mml:mroot>
</mml:mrow>
</mml:math>
<label>(7)</label>
</disp-formula>
</p>
<p>Here, <italic>a</italic>
<sub>i</sub> is an individual desirability score for the <italic>i</italic>-th property of a compound, and <italic>n</italic> is the number of individual properties that get combined to produce a single MPO score, where <italic>n</italic>&#x20;&#x3d; 4 in this work. The MPO scoring scheme was integrated as part of the multiparameter optimization solution of LiveDesign (<xref ref-type="bibr" rid="B37">LiveDesign, 2021</xref>) for automation. We note that the geometric mean is used in this work to produce MPO scores instead of the arithmetic mean because the arithmetic mean could cause a dramatic shift in the MPO score by just one of the target properties being an outlier. This could be detrimental to the quality of the generative model, as a single property labeled as bad can disqualify the compound regardless of how high it scores on other properties.</p>
<p>
<xref ref-type="fig" rid="F4">Figure&#x20;4</xref> summarizes how the desirability scores for each of the four hole transport materials properties examined in this work were set with target values and cutoffs. HOMO energy scores were defined such that a maximum score in the &#x201c;middle good&#x201d; mode would be for a target property of &#x2212;5.5&#xa0;eV. Deviations from this target value by 0.5 and 1.5&#xa0;eV were set as the boundaries between good/ok and ok/bad regions, respectively. LUMO energy scores were set with the &#x201c;higher better&#x201d; mode to be a maximum value of &#x2212;3.0&#xa0;eV set as good while below &#x2212;4.0&#xa0;eV was set as bad. Hole reorganization energy scores were set with the &#x201c;lower better&#x201d; mode to minimize the value. We observed known hole transport materials with high charge mobilities with a hole reorganization energy less than 0.3&#xa0;eV (<xref ref-type="bibr" rid="B17">Evans et&#x20;al., 2016</xref>); thus, compounds with reorganization energy below 0.2&#xa0;eV were defined as good while those above 0.4&#xa0;eV were defined as bad. The score was set for the glass transition temperature relative to a &#x201c;higher better&#x201d; mode that maximizes <italic>T</italic>
<sub>
<italic>g</italic>
</sub>. The upper and lower boundaries between good/ok and ok/bad were set as 140&#xb0;, 110&#xb0;C, respectively.</p>
</sec>
</sec>
<sec id="s3">
<title>Design by Generative Model</title>
<p>The prior network from the generative model created more than 20 million chemical structures over 40&#xa0;h of model generation on a single general-purpose GPU card (NVIDIA GeForce GTX 1080). REINVENT also generated 56,290 unique chemical structures when optimizing for MPO score. Further inspection of the generated structures indicates that 93.2% (52,469) of the structures are predicted to have an MPO score of 0.8 or higher. Such high scores on the chemical structures from the generative model provide direct measures for the model performance. Using the diversity selection algorithm featured in Canvas, 2,477 representative candidates out of the 50&#xa0;K &#x2b; structures were further selected for validation. In this work, the group of candidates was used both as the validation set for the MPO score and as the representative design pool for the new hole transport materials. The newly generated chemical compounds from the generative model were predicted with an MPO score higher than 0.8 (56,290). The validation set selected from the diversity selection (2,477) is provided in the supporting information.</p>
<sec id="s3-1">
<title>Validation in Property Space</title>
<p>We assessed the accuracy of the structure-property relationships predicted by the generative model&#x2019;s MPO score for the validation set of 2,477 candidate compounds. MPO scores estimated for the validation set compounds were compared to the properties (i.e.,&#x20;orbital energies and hole reorganization energy by quantum chemical calculations and <italic>T</italic>
<sub>
<italic>g</italic>
</sub> from QSPR predictions) of the 8,627 training set compounds used to build the scorer network. A comparison of the distributions of MPO scores between the training set for the scorer network and the validation set created by the generative model is shown in <xref ref-type="fig" rid="F5">Figure&#x20;5</xref>. It is clear, as shown in the figure, that the agent network from the generative model is fully capable of generating a large number of chemical structures that exceed property scores compared to the chemical structures used as the starting&#x20;point.</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption>
<p>MPO score distribution (histogram) of the training set for the scorer network (blue) and the validation set generated by the generative model (red).</p>
</caption>
<graphic xlink:href="fchem-09-800370-g005.tif"/>
</fig>
<p>We note the MPO scores shown in the figure for the validation set are not the scores produced by the agent network from the generative model as part of the model predictions. Instead, the MPO scores were individually recomputed based on the properties of each compound through quantum chemical calculations (for the orbital energies and the reorganization energy) and QSPR predictions (<italic>T</italic>
<sub>g</sub>). We find that nearly 84% of the remaining validation set compounds (2,088) score greater than or equal to 0.8 on the MPO score after the reevaluation of the individual properties. The MPO score of 0.8 in this work is designed to be the indicator that differentiates a good design from a bad design, and the number of compounds among the validation set with the MPO score greater than 0.8 would provide the predictive measure of the structure-property relationship model used within the generative model itself.</p>
<p>The results presented in the MPO score distribution indicate that a generative model can design new chemistry while significantly pushing the property profile into the desired MPO score range of 0.92 as compared to the property space from the training set where the MPO score is almost evenly distributed between 0 and&#x20;1.</p>
<p>We compared the individual design properties between the training set chemistry and the generative model chemistry, see <xref ref-type="fig" rid="F6">Figure&#x20;6</xref>. Comparisons of the percentages within the target space between the training set and the validation set chemistry are summarized in <xref ref-type="table" rid="T1">Table&#x20;1</xref>. Overall, we found that individual properties and MPO scores are generally in the expected target property range. Further analysis revealed two different types of variation in the property space derived from the generated chemistry model. The first type is where the newly developed chemistry becomes enriched in a property space corresponding to the more desirable hole reorganization energy and the LUMO energy.</p>
<fig id="F6" position="float">
<label>FIGURE 6</label>
<caption>
<p>Comparisons between the training set chemistry (blue) and the chemistry created by the generative model (red) over the four individual design properties considered in this work - hole reorganization energy (upper left), HOMO energy (upper right), LUMO energy (lower left), and glass transition temperature (lower right).</p>
</caption>
<graphic xlink:href="fchem-09-800370-g006.tif"/>
</fig>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Percentages of chemical compounds from the training set and the validation set generative chemistry model bound within the target&#x20;space.</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Property</th>
<th align="center">MPO</th>
<th align="center">
<italic>E</italic>
<sub>HOMO</sub> (eV)</th>
<th align="center">
<italic>E</italic>
<sub>LUMO</sub> (eV)</th>
<th align="center">
<italic>&#x3bb;</italic>
<sub>
<italic>h</italic>
</sub> (eV)</th>
<th align="center">
<italic>T</italic>
<sub>
<italic>g</italic>
</sub> (&#xb0;C)</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Target interval space</td>
<td align="char" char=".">[0.8, 1]</td>
<td align="char" char=".">[&#x2212;5.7, &#x2212;5.3]</td>
<td align="char" char=".">[&#x2212;3.0, 0.0]</td>
<td align="char" char=".">[0.0, 0.2]</td>
<td align="center">[140, &#x221e;]</td>
</tr>
<tr>
<td align="left">% in training set chemistry</td>
<td align="char" char=".">16.1</td>
<td align="char" char=".">32.3</td>
<td align="char" char=".">59.0</td>
<td align="char" char=".">36.9</td>
<td align="char" char=".">23.0</td>
</tr>
<tr>
<td align="left">% in design by generative model</td>
<td align="char" char=".">84.1</td>
<td align="char" char=".">86.1</td>
<td align="char" char=".">55.4</td>
<td align="char" char=".">70.9</td>
<td align="char" char=".">95.5</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>In contrast, a significant reduction in the population of less-desired properties is observed. There is an enrichment in the desired property space marked with an improved distribution corresponding to ideal HOMO energy and glass transition temperatures in this second grouping.</p>
<p>For the hole reorganization energy, most of the validation set chemistry from the generative model shares a hole reorganization energy below 0.2&#xa0;eV. The training set chemistry was constructed with substructures from known OLED chemistry. Consequently, the hole reorganization energies were already well regulated in the training set space. As such, there was little need to drive down the average value for the reorganization energy for the newly generated chemistry. Instead, it is more desirable to minimize the number of compounds generated with the reorganization energies that are much higher than the mode of the distribution. This is indeed the observed trend from the newly generated chemistry in <xref ref-type="fig" rid="F6">Figure&#x20;6</xref>.</p>
<p>Orbital energies show signs of improvement from the generative model by delivering an enriched LUMO energy and favorable shift of the HOMO energy. However, a couple of observations cannot be simply addressed as improvements in the property space. The HOMO energy, for example, of the validation set lies close to the target property, and it shows a bimodal distribution with fewer centered at the desired value of &#x2212;5.5&#xa0;eV versus the two modes centered around &#x2212;5.56&#xa0;eV and &#x2212;5.32&#xa0;eV. In the LUMO case, the generative model does not seem able to push the LUMO energy much higher than the starting point. Instead, it can be seen from the summary in <xref ref-type="table" rid="T1">Table&#x20;1</xref> that the generative model returns a reduced number of compounds from the target property&#x20;space.</p>
<p>This performance indicates a specific limitation, and hence, requires a close inspection of the generative model by the user. In this case, a generative model scheme improved molecular electronic property prediction. However, it is essential to note that some property subspaces may be inherently unapproachable by an initially defined and trained prior network. Again, a close inspection by the user of each property is required before assessing the model&#x2019;s validity. Further, while LUMO energy space did not seem to show as impressive an improvement as other property space, the starting point for LUMO energy already had the highest percentage of structures in the training set (59%) that meet the design criteria. As such, maintaining the equivalent ratio of chemistry that meets the criteria while simultaneously satisfying other critical design criteria, and retaining a high MPO score, was still deemed a significant success.</p>
<p>The glass transition temperature can illustrate the most straightforward improvement among the individual target properties that drive the generative model. The validation chemistry from the generative model pushes the average <italic>T</italic>
<sub>
<italic>g</italic>
</sub> towards the upper-bound of the starting distribution from the training set while resulting in a significant shift of the average <italic>T</italic>
<sub>
<italic>g</italic>
</sub> expected from the materials by nearly 60&#xb0;C, with over 95% of the new materials designed by the model satisfying the property target (<italic>T</italic>
<sub>
<italic>g</italic>
</sub> &#x3e; 140&#xb0;C).</p>
</sec>
<sec id="s3-2">
<title>Validation in Chemical Design Space</title>
<p>One advantage of using recurrent neural networks in combination with reinforcement learning for a generative chemistry model (<xref ref-type="bibr" rid="B50">Olivecrona et&#x20;al., 2017</xref>) is the ability to generate valid chemical structures with a much higher success rate than traditional methods such as variational autoencoder algorithms (<xref ref-type="bibr" rid="B3">Alperstein et&#x20;al., 2019</xref>; <xref ref-type="bibr" rid="B29">Jewell et&#x20;al., 2021</xref>). For example, the convolutional variational autoencoder (CVAE) has been widely known among the drug discovery community as a fast and efficient tool to generate new molecular structures. Yet, the approach is often challenged by the low success rate in generating valid chemical structures, let&#x20;alone ones with the desired properties (<xref ref-type="bibr" rid="B35">Lim et&#x20;al., 2018</xref>). On the other hand, we confirmed that over 80% of the two million-plus SMILES strings generated by the prior network in this work were valid chemical structures, and rendering the rate of developing valid chemistry a non-issue for this framework. Optimization in the property space has also proven more successful with the RNN based generative design, as reported in benchmark studies (<xref ref-type="bibr" rid="B8">Brown et&#x20;al., 2019</xref>; <xref ref-type="bibr" rid="B39">Marques et&#x20;al., 2021</xref>).</p>
<p>As the first step to understanding the design space, we examined the overall similarity between the chemical structures from the training set for the scorer network and the validation set generated by the model. Similarities between chemical structures were quantified by a Tanimoto distance metric that is a normalized measure of the similarity in descriptor space between two molecules:<disp-formula id="e8">
<mml:math id="m8">
<mml:mrow>
<mml:mi mathvariant="normal">S</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
<mml:mi mathvariant="normal">m</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
<mml:mi mathvariant="normal">l</mml:mi>
<mml:mi mathvariant="normal">a</mml:mi>
<mml:mi mathvariant="normal">r</mml:mi>
<mml:mi mathvariant="normal">i</mml:mi>
<mml:mi mathvariant="normal">t</mml:mi>
<mml:mi mathvariant="normal">y</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:munder>
<mml:mo>&#x2211;</mml:mo>
<mml:mi>i</mml:mi>
</mml:munder>
<mml:mrow>
<mml:msubsup>
<mml:mi>x</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>B</mml:mi>
</mml:msubsup>
<mml:msubsup>
<mml:mi>x</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>A</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:munder>
<mml:mo>&#x2211;</mml:mo>
<mml:mi>i</mml:mi>
</mml:munder>
<mml:mrow>
<mml:msubsup>
<mml:mi>x</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>A</mml:mi>
</mml:msubsup>
<mml:msubsup>
<mml:mi>x</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>A</mml:mi>
</mml:msubsup>
<mml:mo>&#x2b;</mml:mo>
<mml:mstyle displaystyle="true">
<mml:munder>
<mml:mo>&#x2211;</mml:mo>
<mml:mi>i</mml:mi>
</mml:munder>
<mml:mrow>
<mml:msubsup>
<mml:mi>x</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>B</mml:mi>
</mml:msubsup>
<mml:msubsup>
<mml:mi>x</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>B</mml:mi>
</mml:msubsup>
<mml:mo>&#x2212;</mml:mo>
<mml:mstyle displaystyle="true">
<mml:munder>
<mml:mo>&#x2211;</mml:mo>
<mml:mi>i</mml:mi>
</mml:munder>
<mml:mrow>
<mml:msubsup>
<mml:mi>x</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>B</mml:mi>
</mml:msubsup>
<mml:msubsup>
<mml:mi>x</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>A</mml:mi>
</mml:msubsup>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:mstyle>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
<label>(8)</label>
</disp-formula>where <italic>A</italic> and <italic>B</italic> are indicators for two different molecules in comparison (with <italic>A</italic> being the reference molecule). In this work, we use extended-connectivity fingerprints from RDKit (<xref ref-type="bibr" rid="B53">Rogers and Hahn, 2010</xref>) as the descriptor space for estimating the similarities, and as such, <italic>i</italic> denotes an index for the fingerprint bit. The similarity value per pair of molecules lies between one and zero based on the definition. One indicates identical molecules, while zero indicates a complete dissimilarity. The primary purpose of the analysis is to assess the novelty of the design space quantitatively. In an ideal scenario, the candidate materials space created by the generative model would be 1) close enough to the training set space to retain the original design space characteristics (<italic>e.g.</italic>, organic compounds with a resemblance to hole transport materials) and 2) far enough from the training set space to have an improved set of properties as predicted by the machine learning algorithms.</p>
<p>Five hundred top-ranked structures were selected based on the MPO score from the newly generated structures in the generative model. Then, for each of the structures, a new chemical structure with the highest Tanimoto similarity was selected based on its MPO score:<disp-formula id="e9">
<mml:math id="m9">
<mml:mrow>
<mml:mi>&#x394;</mml:mi>
<mml:mi>M</mml:mi>
<mml:mi>P</mml:mi>
<mml:mi>O</mml:mi>
<mml:mtext>&#xa0;</mml:mtext>
<mml:mo>&#x3d;</mml:mo>
<mml:mtext>&#xa0;</mml:mtext>
<mml:mi>M</mml:mi>
<mml:mi>P</mml:mi>
<mml:msub>
<mml:mi>O</mml:mi>
<mml:mi>G</mml:mi>
</mml:msub>
<mml:mo>&#x2212;</mml:mo>
<mml:mi>M</mml:mi>
<mml:mi>P</mml:mi>
<mml:msub>
<mml:mi>O</mml:mi>
<mml:mi>S</mml:mi>
</mml:msub>
</mml:mrow>
</mml:math>
<label>(9)</label>
</disp-formula>where,<disp-formula id="e10">
<mml:math id="m10">
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mi>P</mml:mi>
<mml:msub>
<mml:mi>O</mml:mi>
<mml:mi>G</mml:mi>
</mml:msub>
<mml:mo>&#x3d;</mml:mo>
<mml:mi>M</mml:mi>
<mml:mi>P</mml:mi>
<mml:mi>O</mml:mi>
<mml:mrow>
<mml:mo>{</mml:mo>
<mml:mrow>
<mml:mi>n</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>w</mml:mi>
<mml:mi>d</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>s</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>g</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>d</mml:mi>
<mml:mi>b</mml:mi>
<mml:mi>y</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>h</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>g</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>v</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>m</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>d</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>l</mml:mi>
</mml:mrow>
<mml:mo>}</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
<label>(10)</label>
</disp-formula>
<disp-formula id="e11">
<mml:math id="m11">
<mml:mrow>
<mml:mi>M</mml:mi>
<mml:mi>P</mml:mi>
<mml:msub>
<mml:mi>O</mml:mi>
<mml:mi>S</mml:mi>
</mml:msub>
<mml:mtext>&#xa0;</mml:mtext>
<mml:mo>&#x3d;</mml:mo>
<mml:mtext>&#xa0;</mml:mtext>
<mml:mi>M</mml:mi>
<mml:mi>P</mml:mi>
<mml:mi>O</mml:mi>
<mml:mrow>
<mml:mo>{</mml:mo>
<mml:mrow>
<mml:mi>c</mml:mi>
<mml:mi>l</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>s</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>s</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>s</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>b</mml:mi>
<mml:mi>l</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>g</mml:mi>
<mml:mi>f</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>m</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>h</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>t</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>i</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>g</mml:mi>
<mml:mi>s</mml:mi>
<mml:mi>e</mml:mi>
<mml:mi>t</mml:mi>
</mml:mrow>
<mml:mo>}</mml:mo>
</mml:mrow>
</mml:mrow>
</mml:math>
<label>(11)</label>
</disp-formula>
</p>
<p>Note that &#x2206;MPO &#x3e;0 indicates improved properties with the new design but an &#x2206;MPO &#x3c;0 is a decline in the design properties. <xref ref-type="fig" rid="F7">Figure&#x20;7A</xref> summarizes the difference in MPO scores for all 500 pairs of structures picked from the top-ranked validation set compounds and the corresponding (closest-resembling) training set compounds. <xref ref-type="fig" rid="F7">Figure&#x20;7B</xref> also shows the distribution of the MPO score difference by a histogram.</p>
<fig id="F7" position="float">
<label>FIGURE 7</label>
<caption>
<p>
<bold>(A)</bold> Similarity vs &#x2206;MPO of the top-500-ranked new designs by MPO score and <bold>(B)</bold> the distribution of &#x2206;MPO shown as a histogram with a dashed line marking the point of no improvement (i.e.,&#x20;&#x2206;MPO &#x3d; 0). Each data point from <bold>(A)</bold> is drawn with a circle whose size scales to the MPO score of the newly designed target.</p>
</caption>
<graphic xlink:href="fchem-09-800370-g007.tif"/>
</fig>
<p>Most of the structure pairs shown in the plot mark a similarity score greater than 0.50 on the <italic>x</italic>-axis, confirming a solid resemblance between the newly generated structures and the starting space for those designs. The next thing to notice is that most of the data points (461 out of 500, or 92.2%) shown in <xref ref-type="fig" rid="F7">Figure&#x20;7</xref> lie above the line &#x2206;MPO &#x3d; 0, implying the improvement of the target properties over the closest representations from the training set space. The maximum &#x2206;MPO is around 0.5, while the minimum &#x2206;MPO score is less than around &#x2212;0.03. So, the extent of improvement is much greater than decline. Its also noteworthy that the most significant improvement in the property space occurred when the similarity between the closest siblings in training and validation sets ranges from 0.55 to&#x20;0.70.</p>
<p>
<xref ref-type="fig" rid="F8">Figure&#x20;8</xref> lists a couple of example pairs selected from the similarity analysis. One derives from the high-scoring machine-generated design, and the other from a training set space where the scorer network resembles the machine-generated design. Inspecting the individual chemical structures generated by the model with high scores, we find many of the structures contain one of the 38 original core chemistries provided as the basis for building the prior network. In <xref ref-type="fig" rid="F8">Figure&#x20;8</xref>, for example, two apparent core structures have driven the generative and training set chemistry models into relatively higher MPO ranges than average. This result is consistent with the general observation that the generative molecular structures are defined by core-fragments found in the training chemistry and the generative molecular structure space. This introduces a constraint on structure diversity in this study but will be the subject of future&#x20;work.</p>
<fig id="F8" position="float">
<label>FIGURE 8</label>
<caption>
<p>Machine-drawn examples created by the generative model (<bold>M1</bold> and <bold>M2</bold>) and their counterparts in the training set space for the scorer network with the highest similarity (<bold>T1</bold> and <bold>T2</bold>) are shown with individual properties and their MPO scores. <bold>(A)</bold> Similarity 0.565, <bold>(B)</bold> Similarity 0.706.</p>
</caption>
<graphic xlink:href="fchem-09-800370-g008.tif"/>
</fig>
<p>We note a unique aspect of the design results in an increase of MPO score by nearly 0.2 while there is no apparent structural correlation between the training and the validation set compounds. In most of these cases, comparing the training set chemistry and the generative model design points to a trend wherein the structural features not shared by the two are often alien to the 38 core structures used to build the prior network. This often leads to a reduced number of symmetry points and, thus, increases the uniqueness of each design. Based on this aspect, newly generated molecular design by the generative model can benefit from the known chemical design space that is proven to work while suggesting new design ideas to push the target property space even further. More specific design strategies to accomplish this will be discussed in the later section in more detail.</p>
<p>One of the desired traits of the generative model for chemistry is to have the capability to extrapolate target properties beyond the range that the training set data provides. While the MPO scoring scheme we used in this work is not designed explicitly to support the capability of extending the score outside the training set domain&#x2014;<italic>i.e.</italic>, by confining them with the definition of the MPO score to be between 0 and 1&#x2014;individual properties are not strictly bound by such constraints and still have the freedom to result in an extrapolation. In fact, we observe in <xref ref-type="fig" rid="F6">Figure&#x20;6</xref> the sign of extrapolation in the glass transition temperature with the newly generated compounds, as the validation set analyzed in this work has 17 compounds with <italic>T</italic>
<sub>
<italic>g</italic>
</sub> greater than the upper limit from the training set (215&#xb0;C). This is supported by the previous study where the REINVENT formalism was used to create the new molecular designs (<xref ref-type="bibr" rid="B39">Marques et&#x20;al., 2021</xref>), reporting the model&#x2019;s general capability of extrapolating outside the training set domain. Based on our observation, we believe the best strategy to bring the extrapolation capability to the generative model is 1) to take advantage of multiparameter optimization, 2) to maximize the number of training set data to provide enough resolution in the property space to extend near the edges of the training set domain, and 3) to have the property prediction model&#x2014;such as quantum chemistry for electronic properties and QSPR for glass transition used in this work&#x2014;available well outside the training set space to keep the accuracy of predicted properties for the validation sets&#x20;high.</p>
</sec>
<sec id="s3-3">
<title>Validation by Chemical Stability</title>
<p>Chemical stability is an essential design for any novel organic electronic material. Bond dissociation energy (BDE) of the weakest bond for a chemical compound is often considered a good predictor of chemical and operational stability. An explicit demonstration for hole transport materials was previously described by Kwon and coworkers and Kondakov and coworkers (<xref ref-type="bibr" rid="B34">Lee et&#x20;al., 2021</xref>). Unfortunately, there is significant difficulty incorporating BDE of the weakest bond into the scoring function for a generative model. First, the cost associated with accurate predictions for all BDEs in a given molecule is prohibitively expensive (i.e.,&#x20;it scales approximately as 3&#xb7;<italic>n</italic> times the cost of orbital energy calculations where <italic>n</italic> is the number of bonds per molecule). Second, the BDE for the weakest bond of an entire molecule is extremely sensitive to the subtle changes in the molecule&#x2019;s chemical structure and conformation. A machine learning approach for prediction is nearly impossible, and further, we note this is a different problem than predicting a single BDE of a particular bond given surrounding chemistry (<xref ref-type="bibr" rid="B66">St. John et&#x20;al., 2020</xref>).</p>
<p>We introduced a post-generative screening stage to refine the machine-generated and model-augmented designs by the weakest BDEs of compounds. This works particularly well with hole transport material design since the training set for the prior network is based on a partially conjugated organic space that is not expected to show the instability typical in other design spaces such as high-energy materials.</p>
<p>For all design examples shown in this work, BDEs of the weakest bond at the ground state (S<sub>0</sub>) and the triplet excited state (T<sub>1</sub>) were computed by quantum chemical simulation using LACV3P&#x2a;&#x2a; basis set and B3LYP functional. Given the environment in which the hole transport layers are often deployed, BDEs of the cationic (<italic>i.e.</italic>, positively charged) and the anionic states (<italic>i.e</italic>., negatively charged) were also computed. For each molecule, the BDE of the weakest bond was determined by calculating BDEs computed for the bonds that can dissociate without involving hydrogen abstraction processes. Each BDE is computed as the energy difference between the homolytic dissociation of a single, acyclic bond from the input molecular compound. For the excited state BDEs, the energy before the bond dissociation was computed at the designated excited state (<italic>i.e.</italic>, S<sub>1</sub> or T<sub>1</sub>), representing the initial state for the bond dissociation process. For the charged state BDEs, one electron was added to (for anionic BDE) or removed from (for cationic BDE) the molecule before and after the bond dissociation. Since one can place the extra charge on either side of the dissociated species, each bond results in two independent BDEs for each charged state. This algorithm was automated to be performed over all input structures for all initial states&#x2014;<italic>i.e.</italic>, neutral, excited, cationic, and anionic. Once the BDEs were computed, they were sorted to identify each state&#x2019;s lowest BDE per compound. The BDE analysis based on the weakest link of each compound ensures the chemical design created or inspired by the generative model meets the minimum requirements of compound stability under the normal operation of the device.</p>
</sec>
</sec>
<sec id="s4">
<title>
<italic>De Novo</italic> Design Strategy and Outlook</title>
<sec id="s4-1">
<title>Design Augmented by the Generative Model</title>
<p>The new chemistry drawn from the generative model provides a methodology for autonomous materials design. While the raw chemistry generated as SMILES strings from the generative model shows a list of interesting molecular structures paired with desired properties, much greater insights can be extracted from the individual design suggestions.</p>
<p>First, the generative model methodology demonstrates a viable approach to autonomous material design by delivering viable hole transport structures. While the diversity of structures in this first stage does not take explicit synthetic difficulty into account, it does, however, and minimize the bias a practicing chemist brings to molecular design. Second, one can more efficiently examine a structural space and ensure it has been thoroughly investigated versus the traditional empirical approaches. Third, the model accurately reflects existing known design rules. For example, successful HTL molecules in the design space minimize lone-pair electrons on heteroatoms that are not sterically hindered (<italic>e.g.,</italic> protected) as they may be susceptible to known degradation paths such as photochemical or cationic-nucleophilic reactions, see <xref ref-type="fig" rid="F8">Figure&#x20;8</xref> (<xref ref-type="bibr" rid="B65">So and Kondakov, 2010</xref>; <xref ref-type="bibr" rid="B54">Schmidbauer et&#x20;al., 2013</xref>).</p>
<p>While these unwanted characteristics can be filtered out in generating new chemistry, this will result in the loss of a significant number of new candidates generated by the model and thus, interfere with the value we get from examining a diverse set. A recommended strategy in the putative workflow is to investigate the representative groups of compounds that share frequently appearing substructure patterns, then apply minor corrections in their design by manual inspection.</p>
<p>
<xref ref-type="fig" rid="F9">Figure&#x20;9</xref> shows select candidates (<bold>D1</bold>, <bold>D2</bold>, and <bold>D3</bold>) derived from structures frequently appearing in the validation set and having high MPO scores while incorporating fewer less-desirable fluorination and alkylation substituents. For example, it has been reported that fluorine substituents on aromatic and heterocyclic ring systems are prone to a variety of chemistries (<italic>e.g.</italic>, homolytic and heterolytic fragmentation or even substitution nucleophilic aromatic (SNAr) reactions with nucleophiles such as pyridyl nitrogen (<xref ref-type="bibr" rid="B38">March 1985</xref>; <xref ref-type="bibr" rid="B61">Shi et&#x20;al., 2015</xref>). Further, alkyl substituents that are para- or ortho-to an <italic>sp3</italic> hybridized nitrogen (triarylamine) are suspected to be sites for chemical degradation through free-radical formation, but this has yet to be proven experimentally. Again, the refined set of structures were (re)validated with relatively high MPO scores (MPO<sub>
<bold>D1</bold>
</sub> &#x3d; 0.78, MPO<sub>
<bold>D2</bold>
</sub> &#x3d; 0.72, and MPO<sub>
<bold>D3</bold>
</sub> &#x3d; 0.95), and then further examined for their chemical stability represented by the dissociation energies of the weakest bond, relative to that of a reference hole transport material, NPB (N,N&#x2032;-Di (1-naphthyl)-N,N&#x2032;-diphenyl-(1,1&#x2032;-biphenyl)-4,4&#x2032;-diamine, and chemical structure shown in <xref ref-type="fig" rid="F9">Figure&#x20;9</xref>), on the different potential energy surfaces reviewed (<italic>e.g.</italic>, ground state, triplet-excited state, cationic, and anionic states), confirm that all structures were valid hole transport material candidates.</p>
<fig id="F9" position="float">
<label>FIGURE 9</label>
<caption>
<p>Bond dissociation energies for the ground state (S<sub>0</sub>), triplet-excited state (T<sub>1</sub>), cationic state, and anionic state, predicted by quantum chemical calculations over three example hole transport material designs derived from the generative model (<bold>D1</bold>, <bold>D2</bold>, and <bold>D3</bold>), and compared to a known hole transport material, NPB (shown on top).</p>
</caption>
<graphic xlink:href="fchem-09-800370-g009.tif"/>
</fig>
<p>Another design rule can be extracted from the generative model by examining the pattern of how the machine draws the new compounds rather than simply accepting computed recommendations. The success of this methodology is evidenced by the similarity analysis summarized in <xref ref-type="fig" rid="F7">Figure&#x20;7</xref>; many chemical motifs from the training set for the prior network reappear in the candidates from the generative&#x20;model.</p>
<p>
<xref ref-type="fig" rid="F10">Figure 10</xref> illustrates how these frequently appearing motifs are identified amongst the candidate compounds generated by the model <xref ref-type="fig" rid="F10">Figures&#x20;10A&#x2013;D</xref>. During the manual inspection of several high-scoring compounds, we found that a particular set of structural patterns appear with higher frequency than others, and such as those marked in the figure with the dotted lines. We identified that these patterns are tied to the design rules that are not as obvious to the human eye and can be used to create another set of more advanced designs that neither human nor machine has considered.</p>
<fig id="F10" position="float">
<label>FIGURE 10</label>
<caption>
<p>Four examples <bold>(A&#x2013;D)</bold> of the high-MPO-scoring compounds from the generative model are accompanied by some of the frequently appearing substructure motifs, marked by the area enclosed within the dotted lines.</p>
</caption>
<graphic xlink:href="fchem-09-800370-g010.tif"/>
</fig>
<p>The advantage of this strategy is that unlike blindly accepting the outcome of the generative model, one could get access to a much clearer logic behind the structure-property relationships. It also presents an opportunity for the materials experts to seamlessly compare their ideas and intuition with the machine model results.</p>
<p>Not surprisingly, most of the frequently appearing substructures are among the fragments found in either the core or the R-group chemistry used to build the prior network. This means the design process relies on concentrating the existing chemical design space on what works best rather than digging up an entirely new chemical space every time. This design approach represents an enrichment of the chemical&#x20;space.</p>
<p>At the same time, the generative model does not systematically inhibit the appearance of a brand-new chemical motif. <xref ref-type="fig" rid="F10">Figure&#x20;10D</xref> is an example of the substructure marked by the dotted line, spiro[acridine-9,9&#x2032;-xanthene] group, which has also appeared in <bold>D3</bold> and had never been introduced as part of the core chemistry used to build the prior network.</p>
<p>Based on the recognized substructure patterns among the high-scoring candidates returned by the generative model, we built a small set following these simple design rules:<list list-type="simple">
<list-item>
<p>(1) Assemble a structure with two or fewer substructures identified from the raw design</p>
</list-item>
<list-item>
<p>(2) Maintain high symmetry for synthetic viability</p>
</list-item>
<list-item>
<p>(3) Use fast QM calculations, including the BDE analysis, and to iterate through&#x20;ideas</p>
</list-item>
</list>
</p>
<p>
<xref ref-type="fig" rid="F11">Figure&#x20;11</xref> lists three of the simplest design examples following these rules. Among the examples shown in the figure, two (<bold>R1</bold> and <bold>R2</bold>) are from simple recombination of the frequently appearing chemical substructures from the generative model, 10-phenyl phenoxazine and 10-phenyl 10H-spiro acridine-9,9&#x2032;-fluorene, respectively. They are based on a primary design principle that combines the same symmetry point at the center (2-fold rotational) and the core chemistry (biphenyl) of NPB. The remaining structure (<bold>R3</bold>) is an extension of a known chemical motif, truxene (<xref ref-type="bibr" rid="B72">Yang et&#x20;al., 2009</xref>; <xref ref-type="bibr" rid="B23">Goubard and Dumur, 2015</xref>; <xref ref-type="bibr" rid="B61">Shi et&#x20;al., 2015</xref>), and with an R-group (isoquinoline) that appears in the machine-drawn candidates with high frequency.</p>
<fig id="F11" position="float">
<label>FIGURE 11</label>
<caption>
<p>Bond dissociation energies for the ground state (S<sub>0</sub>), triplet-excited state (T<sub>1</sub>), cationic state, and anionic state, predicted by quantum chemical calculations over three example hole transport material designs derived from the generative model <bold>(R1, R2, and R3)</bold> derived from the design principle that takes the patterns observed by the generative model as input while coupling them with user directives.</p>
</caption>
<graphic xlink:href="fchem-09-800370-g011.tif"/>
</fig>
<p>The example designs <bold>R1&#x2013;R3</bold> were assessed for their predicted properties in the same manner as previously done (<bold>D1&#x2013;D3</bold>), and the MPO scores for all three remain quite high (MPO<sub>
<bold>R1</bold>
</sub> &#x3d; 0.88, MPO<sub>
<bold>R2</bold>
</sub> &#x3d; 0.97, and MPO<sub>
<bold>R3</bold>
</sub> &#x3d; 0.95). The dissociation energy of the weakest bonds for <bold>R1</bold> and <bold>R2</bold> in the S<sub>0</sub> and T<sub>1</sub> states are predicted to be equal to or lower than those of NPB. <bold>R3</bold> looks to have significantly better chemical stability, given that the BDE from the weakest bond is expected to be higher than the other two by nearly 50&#xa0;kcal/mol for all examined states. BDE of the weakest bonds for the cationic and the anionic surfaces are predicted to be higher than that of NPB, confirming a legitimate design example for novel hole transport materials that can withstand both hole and electron currents. MPO scores and the individual material properties (including the results from BDE analysis) of the six example designs are summarized in <xref ref-type="table" rid="T2">Table&#x20;2</xref> for a quick comparison.</p>
<table-wrap id="T2" position="float">
<label>TABLE 2</label>
<caption>
<p>Summary of MPO, individual design properties, and BDE analysis results for the machine-drawn design examples (<bold>D1&#x2013;D3</bold>) and recombination with frequently appearing structural patterns (<bold>R1&#x2013;R3</bold>).</p>
</caption>
<table>
<thead valign="top">
<tr>
<th rowspan="2" align="left">Design</th>
<th rowspan="2" align="center">MPO</th>
<th rowspan="2" align="center">
<italic>E</italic>
<sub>HOMO</sub> (eV)</th>
<th rowspan="2" align="center">
<italic>E</italic>
<sub>LUMO</sub> (eV)</th>
<th rowspan="2" align="center">
<italic>&#x3bb;</italic>
<sub>
<italic>h</italic>
</sub> (eV)</th>
<th rowspan="2" align="center">
<italic>T</italic>
<sub>
<italic>g</italic>
</sub> (&#xb0;C)</th>
<th colspan="4" align="center">Weakest BDE (kcal/mol)</th>
</tr>
<tr>
<th align="center">
<italic>S</italic>
<sub>
<italic>0</italic>
</sub>
</th>
<th align="center">
<italic>T</italic>
<sub>
<italic>1</italic>
</sub>
</th>
<th align="center">
<italic>Cation</italic>
</th>
<th align="center">
<italic>Anion</italic>
</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">
<bold>D1</bold>
</td>
<td align="char" char=".">0.78</td>
<td align="char" char=".">&#x2212;5.77</td>
<td align="char" char=".">&#x2212;2.75</td>
<td align="char" char=".">0.12</td>
<td align="char" char=".">125</td>
<td align="char" char=".">85.5</td>
<td align="char" char=".">44.4</td>
<td align="char" char=".">108.6</td>
<td align="char" char=".">51.0</td>
</tr>
<tr>
<td align="left">
<bold>D2</bold>
</td>
<td align="char" char=".">0.72</td>
<td align="char" char=".">&#x2212;5.43</td>
<td align="char" char=".">&#x2212;2.44</td>
<td align="char" char=".">0.18</td>
<td align="char" char=".">120</td>
<td align="char" char=".">109.8</td>
<td align="char" char=".">53.1</td>
<td align="char" char=".">130.6</td>
<td align="char" char=".">91.6</td>
</tr>
<tr>
<td align="left">
<bold>D3</bold>
</td>
<td align="char" char=".">0.95</td>
<td align="char" char=".">&#x2212;5.57</td>
<td align="char" char=".">&#x2212;2.61</td>
<td align="char" char=".">0.14</td>
<td align="char" char=".">168</td>
<td align="char" char=".">70.7</td>
<td align="char" char=".">18.5</td>
<td align="char" char=".">78.3</td>
<td align="char" char=".">41.9</td>
</tr>
<tr>
<td align="left">
<bold>R1</bold>
</td>
<td align="char" char=".">0.88</td>
<td align="char" char=".">&#x2212;5.36</td>
<td align="char" char=".">&#x2212;2.49</td>
<td align="char" char=".">0.08</td>
<td align="char" char=".">158</td>
<td align="char" char=".">63.5</td>
<td align="char" char=".">3.8</td>
<td align="char" char=".">78.2</td>
<td align="char" char=".">43.4</td>
</tr>
<tr>
<td align="left">
<bold>R2</bold>
</td>
<td align="char" char=".">0.97</td>
<td align="char" char=".">&#x2212;5.59</td>
<td align="char" char=".">&#x2212;2.42</td>
<td align="char" char=".">0.05</td>
<td align="char" char=".">184</td>
<td align="char" char=".">70.0</td>
<td align="char" char=".">6.1</td>
<td align="char" char=".">81.2</td>
<td align="char" char=".">41.2</td>
</tr>
<tr>
<td align="left">
<bold>R3</bold>
</td>
<td align="char" char=".">0.95</td>
<td align="char" char=".">&#x2212;6.06</td>
<td align="char" char=".">&#x2212;2.60</td>
<td align="char" char=".">0.14</td>
<td align="char" char=".">164</td>
<td align="char" char=".">111.3</td>
<td align="char" char=".">55.3</td>
<td align="char" char=".">130.9</td>
<td align="char" char=".">106.7</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>While the design rules illustrated in this work demonstrate solid pathways to novel organic electronic materials using unbiased, machine-generated information, and these examples also highlight that the human factor cannot be completely isolated. The discontinuity of the structure-property relationship is often quite evident after minor refinement. Still, it may be easily missed by a non-expert. One example of this issue is exemplified with the design of <bold>R1</bold> and <bold>R2</bold>. By following the same design principles (1&#x2013;3) illustrated above, there is no apparent pressure to favor either biphenyl groups or a single phenyl group at the center. However, an experienced OLED expert would immediately note that the biphenyl groups at the center are observed in successful hole transport materials (<italic>e.g.,</italic> NPB, CBP, TPD, and dPVBi, etc.). A quick set of quantum chemical calculations supports the expert&#x2019;s intuition. In this case, the single-phenyl-ring versions of <bold>R1</bold> and <bold>R2</bold> end up with lower bond dissociation energies around the core, especially with near-zero or even negative BDE in the T<sub>1</sub>&#x20;state.</p>
<p>This does not mean a single phenyl ring near the center should be eliminated from design directives. As seen for <bold>D1</bold> and <bold>D2</bold>, the machine found a set of chemical motifs around a single phenyl ring that delivers adequate stability while satisfying critical requirements for hole transport materials. This is an example where the machine can find subtle yet often not-readily-interpretable changes outside the desirable core chemistry, which effectively drive the property space further into the more desired target space, and as shown in <xref ref-type="fig" rid="F8">Figure&#x20;8</xref>. In both cases, the clear benefit of the design augmented by the generative model is that one could form a high-throughput process whereby a machine dispenses unbiased design ideas while human experts constantly filter and refine the list, nudging it in the direction of viable design rules. In other words, the machine becomes an expert tool to accelerate the creation of new design ideas while diversifying the design space in an unbiased manner. But, it is not a replacement for human experts. Instead, it is a tool that augments experts and thus accelerates exploration of a target material&#x20;space.</p>
</sec>
<sec id="s4-2">
<title>Chemistry by Machine: The Next Step</title>
<p>While this work demonstrates the value of using a generative model approach for materials design, many challenges remain. One of them is to account for the subtle balance between chemical diversity and synthesizability in the autonomous chemical design process. In this work, R-group enumeration from known core chemistry and symmetric attachment points was utilized as a simple measure to circumvent the synthesizability issue without explicitly involving additional scoring functions for synthetic viability. This approach produced new chemistry resembling the available design space and identified novel hole transport materials while maintaining synthetic viability. A next step to expand this work would involve constructing a neural network for the generative model with an explicit synthesizability score integrated into the MPO score. The main hurdle for such an approach is the availability of tools that offer sufficient accuracy over the entire molecular space (<xref ref-type="bibr" rid="B7">Boda et&#x20;al., 2007</xref>; <xref ref-type="bibr" rid="B16">Ertl and Schuffenhauer, 2009</xref>; <xref ref-type="bibr" rid="B15">Emami et&#x20;al., 2015</xref>; <xref ref-type="bibr" rid="B56">Schneider et&#x20;al., 2016</xref>; <xref ref-type="bibr" rid="B12">Coley et&#x20;al., 2018</xref>; <xref ref-type="bibr" rid="B33">Konze et&#x20;al., 2019</xref>). Another method uses the transfer learning approach (<xref ref-type="bibr" rid="B44">Merk et&#x20;al., 2018</xref>), which partially retrains the prior networks for a smaller set of known synthesizable structures. This has been shown to enable the agent networks to be biased toward generating more synthesizable structures for an RNN-based generative model of drug discovery (<xref ref-type="bibr" rid="B58">Segler et&#x20;al., 2018</xref>). Such an approach could potentially drive the design process to start with a much more diverse chemical space, then follow up by fine-tuning the design selections with a smaller set of known hole transport materials. The first step towards this is to survey algorithms to produce synthetic accessibility (SA) generally accepted in the community, generate the SA scores for the training set plus the generated set of compounds in this work, and perform a comparative analysis to assess the validity as well as to enhance the MPO scoring scheme towards the synthesizability. We believe this could be an immediate future work, explicitly considering a more extensive set of operational design rules for OLED materials lifetime.</p>
<p>Aside from refining the algorithms to generate new and improved materials chemistry from the generative model, human intuition and how its construction is integrated into the design process plays a critical role in the goal-directed materials discovery process. The hole transport materials example illustrates the importance of expert input when setting up the desired property space for the model and defining the final design rules that are transferable and interpretable. Ultimately, this is not a single stream design process that starts with fixed neural networks and ends with a few refinements. It is designed to work as an iterative process where the neural network and the scoring scheme get updated with new information and insights obtained recursively from the design ideas and the generative&#x20;model.</p>
</sec>
</sec>
<sec sec-type="conclusion" id="s5">
<title>Conclusion</title>
<p>A goal-directed generative model powered by recurrent neural networks and reinforcement learning algorithms is presented as a new materials discovery strategy in organic electronic applications. High-throughput quantum mechanical calculations and automated machine learning algorithms were combined with the RNN-based generative model to produce novel design ideas for molecular materials based on the desired set of target properties and design rules. Demonstration of the framework with a hole transport material example confirms its value as a design tool that accelerates the materials discovery process based on an unbiased sampling of chemical space while optimizing the properties of the materials.</p>
<p>Retaining similarity to the existing hole transport material design space, the generative model successfully created a new set of design ideas while optimizing for target properties, and exemplified by a multiparameter optimization (MPO) score of 92% compared to related structures in the training set chemistry. Despite using a single MPO score to define the goal in the property space, improvements of all individual properties (<italic>e.g.</italic>, orbital energies, hole reorganization energy, and glass transition temperature) were observed across the design suggestions. Utilizing a few expert design principles, one can construct machine-generated design ideas that are used as valuable ingredients for a set of novel design directives that are set to find the balance between chemical diversity and synthetic viability.</p>
<p>We note that the materials design process presented in this work by the goal-directed generative model is not confined to the organic electronics space but introduces a new data-driven design framework for molecular materials. We believe the introduction of the framework will significantly reduce the development cost for new molecular materials, enabling rapid exploration, and validation of a chemical design&#x20;space.</p>
</sec>
</body>
<back>
<sec id="s6">
<title>Data Availability Statement</title>
<p>The original contributions presented in the study are included in the article/Supplementary Material, further inquiries can be directed to the corresponding authors.</p>
</sec>
<sec id="s7">
<title>Author Contributions</title>
<p>HK performed high-throughput molecular simulations and contributed to building the scorer network. YA built the general model&#x2019;s deep neural networks and ran cheminformatics analysis. HK and YA equally contributed to drafting and revising the manuscript. DG developed automated workflows and user interfaces for physics-based simulations and machine learning predictions. TH built the genetic optimization algorithm to construct the chemical design space for the hole transport materials. KL designed and developed the REINVENT algorithm for the generative model. CB contributed to addressing the core challenges in organic electronic materials design and synthesis and led the final revision of the manuscript. HA and MH provided the management and product development support for computational resources and theoretical analysis.</p>
</sec>
<sec sec-type="COI-statement" id="s8">
<title>Conflict of Interest</title>
<p>HK, YA, DG, TH, CB, KL, HA, and MH were employed by the company Schr&#x00F6;dinger, Inc.</p>
<p>The authors declare that this study received funding from Schr&#x00F6;dinger, Inc. This funder had the following involvement in the study: responsible for the design of the study, data collection, analysis, interpretation of data, the writing of this article, and decision to publish the manuscript.</p>
</sec>
<sec sec-type="disclaimer" id="s9">
<title>Publisher&#x2019;s Note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<ack>
<p>The authors would like to thank Paul Winget (Schr&#xf6;dinger, Inc.), Steve L. Dixon (Schr&#xf6;dinger Inc.), and Bill Bridges (Schr&#xf6;dinger Inc.) for insightful technical discussions and software/IT support for cloud computing.</p>
</ack>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Abd El-Karim</surname>
<given-names>S. S.</given-names>
</name>
<name>
<surname>Anwar</surname>
<given-names>M. M.</given-names>
</name>
<name>
<surname>Syam</surname>
<given-names>Y. M.</given-names>
</name>
<name>
<surname>Nael</surname>
<given-names>M. A.</given-names>
</name>
<name>
<surname>Ali</surname>
<given-names>H. F.</given-names>
</name>
<name>
<surname>Motaleb</surname>
<given-names>M. A.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Rational Design and Synthesis of New Tetralin-Sulfonamide Derivatives as Potent Anti-diabetics and DPP-4 Inhibitors: 2D &#x26; 3D QSAR, <italic>In Vivo</italic> Radiolabeling and Bio Distribution Studies</article-title>. <source>Bioorg. Chem.</source> <volume>81</volume>, <fpage>481</fpage>&#x2013;<lpage>493</lpage>. <pub-id pub-id-type="doi">10.1016/j.bioorg.2018.09.021</pub-id> </citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Afzal</surname>
<given-names>M. A. F.</given-names>
</name>
<name>
<surname>Browning</surname>
<given-names>A. R.</given-names>
</name>
<name>
<surname>Goldberg</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Halls</surname>
<given-names>M. D.</given-names>
</name>
<name>
<surname>Gavartin</surname>
<given-names>J.&#x20;L.</given-names>
</name>
<name>
<surname>Morisato</surname>
<given-names>T.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>High-Throughput Molecular Dynamics Simulations and Validation of Thermophysical Properties of Polymers for Various Applications</article-title>. <source>ACS Appl. Polym. Mater.</source> <volume>3</volume> (<issue>2</issue>), <fpage>620</fpage>&#x2013;<lpage>630</lpage>. <pub-id pub-id-type="doi">10.1021/acsapm.0c00524</pub-id> </citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Alperstein</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Cherkasov</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Rolfe</surname>
<given-names>J.&#x20;T.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>All Smiles Variational Autoencoder</article-title>. <comment>arXiv</comment>. </citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>An</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Sherman</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Dixon</surname>
<given-names>S. L.</given-names>
</name>
</person-group> (<year>2012</year>). <article-title>Hole Filling and Library Optimization: Application to Commercially Available Fragment Libraries</article-title>.&#x20;<source>Bioorg. Med. Chem.</source> <volume>20</volume>, <fpage>5379</fpage>&#x2013;<lpage>5387</lpage>. <pub-id pub-id-type="doi">10.1016/j.bmc.2012.03.037</pub-id> </citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>An</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Sherman</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Dixon</surname>
<given-names>S. L.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Kernel-Based Partial Least Squares: Application to Fingerprint-Based QSAR with Model Visualization</article-title>. <source>J.&#x20;Chem. Inf. Model.</source> <volume>53</volume> (<issue>9</issue>), <fpage>2312</fpage>&#x2013;<lpage>2321</lpage>. <pub-id pub-id-type="doi">10.1021/ci400250c</pub-id> </citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bart&#xf3;k</surname>
<given-names>A. P.</given-names>
</name>
<name>
<surname>De</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Poelking</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Bernstein</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Kermode</surname>
<given-names>J.&#x20;R.</given-names>
</name>
<name>
<surname>Cs&#xe1;nyi</surname>
<given-names>G.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Machine Learning Unifies the Modelling of Materials and Molecules</article-title>. <source>Sci. Adv.</source> <volume>3</volume>, <fpage>e1701816</fpage>. <pub-id pub-id-type="doi">10.1126/sciadv.1701816</pub-id> </citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Boda</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Seidel</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Gasteiger</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>Structure and Reaction Based Evaluation of Synthetic Accessibility</article-title>. <source>J.&#x20;Comput. Aided Mol. Des.</source> <volume>21</volume>, <fpage>311</fpage>&#x2013;<lpage>325</lpage>. <pub-id pub-id-type="doi">10.1007/s10822-006-9099-2</pub-id> </citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Brown</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Fiscato</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Segler</surname>
<given-names>M. H. S.</given-names>
</name>
<name>
<surname>Vaucher</surname>
<given-names>A. C.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>GuacaMol: Benchmarking Models for De Novo Molecular Design</article-title>. <source>J.&#x20;Chem. Inf. Model.</source> <volume>59</volume>, <fpage>1096</fpage>&#x2013;<lpage>1108</lpage>. <pub-id pub-id-type="doi">10.1021/acs.jcim.8b00839</pub-id> </citation>
</ref>
<ref id="B9">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Buckley</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2013</year>). <source>Organic Light-Emitting Diodes (OLEDs)</source>. <publisher-loc>Philadelphia</publisher-loc>: <publisher-name>Woodhead Publishing Lmtd.</publisher-name> </citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Butler</surname>
<given-names>K. T.</given-names>
</name>
<name>
<surname>Davies</surname>
<given-names>D. W.</given-names>
</name>
<name>
<surname>Cartwright</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Isayev</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Walsh</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Machine Learning for Molecular and Materials Science</article-title>. <source>Nature</source> <volume>559</volume>, <fpage>547</fpage>&#x2013;<lpage>555</lpage>. <pub-id pub-id-type="doi">10.1038/s41586-018-0337-2</pub-id> </citation>
</ref>
<ref id="B11">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Cheng</surname>
<given-names>J.&#x20;Y.-J.</given-names>
</name>
<name>
<surname>Frangos</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Groysberg</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2021</year>). <source>Harvard Business Review</source>. </citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Coley</surname>
<given-names>C. W.</given-names>
</name>
<name>
<surname>Rogers</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Green</surname>
<given-names>W. H.</given-names>
</name>
<name>
<surname>Jensen</surname>
<given-names>K. F.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>SCScore: Synthetic Complexity Learned from a Reaction Corpus</article-title>. <source>J.&#x20;Chem. Inf. Model.</source> <volume>58</volume> (<issue>2</issue>), <fpage>252</fpage>&#x2013;<lpage>261</lpage>. <pub-id pub-id-type="doi">10.1021/acs.jcim.7b00622</pub-id> </citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>de Oliveira</surname>
<given-names>M. T.</given-names>
</name>
<name>
<surname>Katekawa</surname>
<given-names>E.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>On the Virtues of Automated Quantitative Structure-Activity Relationship: the New Kid on the Block</article-title>. <source>Future Med. Chem.</source> <volume>10</volume>, <fpage>335</fpage>&#x2013;<lpage>342</lpage>. <pub-id pub-id-type="doi">10.4155/fmc-2017-0170</pub-id> </citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dixon</surname>
<given-names>S. L.</given-names>
</name>
<name>
<surname>Duan</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Smith</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Von Bargen</surname>
<given-names>C. D.</given-names>
</name>
<name>
<surname>Sherman</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Repasky</surname>
<given-names>M. P.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>AutoQSAR: an Automated Machine Learning Tool for Best-Practice Quantitative Structure-Activity Relationship Modeling</article-title>. <source>Future Med. Chem.</source> <volume>8</volume>, <fpage>1825</fpage>&#x2013;<lpage>1839</lpage>. <pub-id pub-id-type="doi">10.4155/fmc-2016-0093</pub-id> </citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Emami</surname>
<given-names>F. S.</given-names>
</name>
<name>
<surname>Vahid</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Wylie</surname>
<given-names>E. K.</given-names>
</name>
<name>
<surname>Szymku&#x107;</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Dittwald</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Molga</surname>
<given-names>K.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>A Priori Estimation of Organic Reaction Yields</article-title>. <source>Angew. Chem. Int. Ed.</source> <volume>54</volume> (<issue>37</issue>), <fpage>10797</fpage>&#x2013;<lpage>10801</lpage>. <pub-id pub-id-type="doi">10.1002/anie.201503890</pub-id> </citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ertl</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Schuffenhauer</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>2009</year>). <article-title>Estimation of Synthetic Accessibility Score of Drug-like Molecules Based on Molecular Complexity and Fragment Contributions</article-title>. <source>J.&#x20;Cheminform</source> <volume>1</volume>, <fpage>8</fpage>. <pub-id pub-id-type="doi">10.1186/1758-2946-1-8</pub-id> </citation>
</ref>
<ref id="B17">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Evans</surname>
<given-names>D. R.</given-names>
</name>
<name>
<surname>Kwak</surname>
<given-names>H. S.</given-names>
</name>
<name>
<surname>Giesen</surname>
<given-names>D. J.</given-names>
</name>
<name>
<surname>Goldberg</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Halls</surname>
<given-names>M. D.</given-names>
</name>
<name>
<surname>Oh-e</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Estimation of Charge Carrier Mobility in Amorphous Organic Materials Using Percolation Corrected Random-Walk Model</article-title>. <source>Org. Electro.</source> <volume>29</volume>, <fpage>50</fpage>&#x2013;<lpage>56</lpage>. <pub-id pub-id-type="doi">10.1016/j.orgel.2015.11.021</pub-id> </citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Fujikawa</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Ishii</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Tokito</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Taga</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2000</year>). <article-title>Organic Light-Emitting Diodes Using Triphenylamine Based Hole Transporting Materials</article-title>. <source>MRS Symp. Proc.</source> <volume>621</volume>, <fpage>Q3.4.1</fpage>. <pub-id pub-id-type="doi">10.1557/proc-621-q3.4.1</pub-id> </citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gao</surname>
<given-names>Z. Q.</given-names>
</name>
<name>
<surname>Li</surname>
<given-names>Z. H.</given-names>
</name>
<name>
<surname>Xia</surname>
<given-names>P. F.</given-names>
</name>
<name>
<surname>Wong</surname>
<given-names>M. S.</given-names>
</name>
<name>
<surname>Cheah</surname>
<given-names>K. W.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>C. H.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>Efficient Deep-Blue Organic Light-Emitting Diodes: Arylamine-Substituted Oligofluorenes</article-title>. <source>Adv. Funct. Mater.</source> <volume>17</volume>, <fpage>3194</fpage>&#x2013;<lpage>3199</lpage>. <pub-id pub-id-type="doi">10.1002/adfm.200700238</pub-id> </citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ghanakota</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Bos</surname>
<given-names>P. H.</given-names>
</name>
<name>
<surname>Konze</surname>
<given-names>K. D.</given-names>
</name>
<name>
<surname>Staker</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Marques</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Marshall</surname>
<given-names>K.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Combining Cloud-Based Free-Energy Calculations, Synthetically Aware Enumerations, and Goal-Directed Generative Machine Learning for Rapid Large-Scale Chemical Exploration and Optimization</article-title>. <source>J.&#x20;Chem. Inf. Model.</source> <volume>60</volume> (<issue>9</issue>), <fpage>4311</fpage>&#x2013;<lpage>4325</lpage>. <pub-id pub-id-type="doi">10.1021/acs.jcim.0c00120</pub-id> </citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ghiringhelli</surname>
<given-names>L. M.</given-names>
</name>
<name>
<surname>Carbogno</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Levchenko</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Mohamed</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Huhs</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>L&#xfc;ders</surname>
<given-names>M.</given-names>
</name>
<etal/>
</person-group> (<year>2017</year>). <article-title>Towards Efficient Data Exchange and Sharing for Big-Data Driven Materials Science: Metadata and Data Formats</article-title>. <source>Npj&#x20;Comput. Mater.</source> <volume>3</volume>, <fpage>46</fpage>. <pub-id pub-id-type="doi">10.1038/s41524-017-0048-5</pub-id> </citation>
</ref>
<ref id="B22">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>G&#xf3;mez-Bombarelli</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Aguilera-Iparraguirre</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Hirzel</surname>
<given-names>T. D.</given-names>
</name>
<name>
<surname>Duvenaud</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Maclaurin</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Blood-Forsythe</surname>
<given-names>M. A.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Design of Efficient Molecular Organic Light-Emitting Diodes by a High-Throughput Virtual Screening and Experimental Approach</article-title>. <source>Nat. Mater</source> <volume>15</volume>, <fpage>1120</fpage>&#x2013;<lpage>1127</lpage>. <pub-id pub-id-type="doi">10.1038/nmat4717</pub-id> </citation>
</ref>
<ref id="B23">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Goubard</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Dumur</surname>
<given-names>F.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Truxene: a Promising Scaffold for Future Materials</article-title>. <source>RSC Adv.</source> <volume>5</volume>, <fpage>3521</fpage>&#x2013;<lpage>3551</lpage>. <pub-id pub-id-type="doi">10.1039/c4ra11559g</pub-id> </citation>
</ref>
<ref id="B24">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Halls</surname>
<given-names>M. D.</given-names>
</name>
<name>
<surname>Giesen</surname>
<given-names>D. J.</given-names>
</name>
<name>
<surname>Hughes</surname>
<given-names>T. F.</given-names>
</name>
<name>
<surname>Goldberg</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Cao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Kwak</surname>
<given-names>H. S.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Accelerated Discovery of OLED Materials Through Atomic-Scale Simulation</article-title>. <source>Proc. SPIE</source>, <fpage>9941</fpage>. <pub-id pub-id-type="doi">10.1117/12.2237940</pub-id> </citation>
</ref>
<ref id="B25">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Halls</surname>
<given-names>M. D.</given-names>
</name>
<name>
<surname>Yoshidome</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Mustard</surname>
<given-names>T. J.</given-names>
</name>
<name>
<surname>Goldberg</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Kwak</surname>
<given-names>H. S.</given-names>
</name>
<name>
<surname>Gavartin</surname>
<given-names>J.&#x20;L.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>Atomic-scale Simulation for the Analysis, Optimization and Accelerated Development of Organic Optoelectronic Materials</article-title>. <source>J.&#x20;Imaging Soc. Jpn.</source> <volume>54</volume>, <fpage>561</fpage>&#x2013;<lpage>569</lpage>. <pub-id pub-id-type="doi">10.11370/isj.54.561</pub-id> </citation>
</ref>
<ref id="B26">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Himanen</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Geurts</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Foster</surname>
<given-names>A. S.</given-names>
</name>
<name>
<surname>Rinke</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Data&#x2010;Driven Materials Science: Status, Challenges, and Perspectives</article-title>. <source>Adv. Sci.</source> <volume>6</volume>, <fpage>1900808</fpage>. <pub-id pub-id-type="doi">10.1002/advs.201900808</pub-id> </citation>
</ref>
<ref id="B27">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Iwaloye</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Elekofehinti</surname>
<given-names>O. O.</given-names>
</name>
<name>
<surname>Oluwarotimi</surname>
<given-names>E. A.</given-names>
</name>
<name>
<surname>Kikiowo</surname>
<given-names>B. i.</given-names>
</name>
<name>
<surname>Fadipe</surname>
<given-names>T. M.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Insight into Glycogen Synthase Kinase-3&#x3b2; Inhibitory Activity of Phyto-Constituents from Melissa Officinalis: In Silico Studies</article-title>. <source>Silico Pharmacol.</source> <volume>8</volume>, <fpage>2</fpage>. <pub-id pub-id-type="doi">10.1007/s40203-020-00054-x</pub-id> </citation>
</ref>
<ref id="B28">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jennings</surname>
<given-names>P. C.</given-names>
</name>
<name>
<surname>Lysgaard</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Hummelsh&#xf8;j</surname>
<given-names>J.&#x20;S.</given-names>
</name>
<name>
<surname>Vegge</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Bligaard</surname>
<given-names>T.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Genetic Algorithms for Computational Materials Discovery Accelerated by Machine Learning</article-title>. <source>Npj&#x20;Comput. Mater.</source> <volume>5</volume>, <fpage>46</fpage>. <pub-id pub-id-type="doi">10.1038/s41524-019-0181-4</pub-id> </citation>
</ref>
<ref id="B29">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jewell</surname>
<given-names>J.&#x20;T.</given-names>
</name>
<name>
<surname>Khazaie</surname>
<given-names>V. R.</given-names>
</name>
<name>
<surname>Mohsenzadeh</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2021</year>). <article-title>OLED: One-Class Learned Encoder-Decoder Network with Adversarial Context Masking for Novelty Detection</article-title>. <source>arXiv</source>. </citation>
</ref>
<ref id="B30">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jhulki</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Moorthy</surname>
<given-names>J.&#x20;N.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Small Molecular Hole-Transporting Materials (HTMs) in Organic Light-Emitting Diodes (OLEDs): Structural Diversity and Classification</article-title>. <source>J.&#x20;Mater. Chem. C.</source> <volume>6</volume>, <fpage>8280</fpage>&#x2013;<lpage>8325</lpage>. <pub-id pub-id-type="doi">10.1039/c8tc01300d</pub-id> </citation>
</ref>
<ref id="B31">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kimura</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Kuwano</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Sawaki</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Fujikawa</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Noda</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Taga</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2005</year>). <article-title>New 9-fluorene-type Trispirocyclic Compounds for Thermally Stable Hole Transport Materials in OLEDs</article-title>. <source>J.&#x20;Mater. Chem.</source> <volume>15</volume>, <fpage>2393</fpage>&#x2013;<lpage>2398</lpage>. <pub-id pub-id-type="doi">10.1039/b502268a</pub-id> </citation>
</ref>
<ref id="B32">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kondakova</surname>
<given-names>M. E.</given-names>
</name>
<name>
<surname>Pawlik</surname>
<given-names>T. D.</given-names>
</name>
<name>
<surname>Young</surname>
<given-names>R. H.</given-names>
</name>
<name>
<surname>Giesen</surname>
<given-names>D. J.</given-names>
</name>
<name>
<surname>Kondakov</surname>
<given-names>D. Y.</given-names>
</name>
<name>
<surname>Brown</surname>
<given-names>C. T.</given-names>
</name>
<etal/>
</person-group> (<year>2008</year>). <article-title>High-efficiency, Low-Voltage Phosphorescent Organic Light-Emitting Diode Devices with Mixed Host</article-title>. <source>J.&#x20;Appl. Phys.</source> <volume>104</volume>, <fpage>094501</fpage>. <pub-id pub-id-type="doi">10.1063/1.3000046</pub-id> </citation>
</ref>
<ref id="B33">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Konze</surname>
<given-names>K. D.</given-names>
</name>
<name>
<surname>Bos</surname>
<given-names>P. H.</given-names>
</name>
<name>
<surname>Dahlgren</surname>
<given-names>M. K.</given-names>
</name>
<name>
<surname>Leswing</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Tubert-Brohman</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Bortolato</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Reaction-Based Enumeration, Active Learning, and Free Energy Calculations to Rapidly Explore Synthetically Tractable Chemical Space and Optimize Potency of Cyclin-dependent Kinase 2 Inhibitors</article-title>. <source>J.&#x20;Chem. Inf. Model.</source> <volume>59</volume> (<issue>9</issue>), <fpage>3782</fpage>&#x2013;<lpage>3793</lpage>. <pub-id pub-id-type="doi">10.1021/acs.jcim.9b00367</pub-id> </citation>
</ref>
<ref id="B34">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lee</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Park</surname>
<given-names>J.&#x20;H.</given-names>
</name>
<name>
<surname>Yang</surname>
<given-names>K. J.</given-names>
</name>
<name>
<surname>Hwang</surname>
<given-names>S. J.</given-names>
</name>
<name>
<surname>Braveenth</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Ha</surname>
<given-names>T. H.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>CN-substituted Ortho-Terphenyl Core Based High Triplet Energy Bipolar Host Materials for Stable and Efficient Blue TADF Devices</article-title>. <source>J.&#x20;Mater. Chem. C.</source> <volume>9</volume>, <fpage>7426</fpage>&#x2013;<lpage>7435</lpage>. <pub-id pub-id-type="doi">10.1039/d1tc01119g</pub-id> </citation>
</ref>
<ref id="B35">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lim</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Ryu</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>J.&#x20;W.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>W. Y.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Molecular Generative Model Based on Conditional Variational Autoencoder for De Novo Molecular Design</article-title>. <source>J.&#x20;Cheminform.</source> <volume>10</volume>, <fpage>31</fpage>. <pub-id pub-id-type="doi">10.1186/s13321-018-0286-7</pub-id> </citation>
</ref>
<ref id="B36">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Liu</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Ju</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Shi</surname>
<given-names>S.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Materials Discovery and Design Using Machine Learning</article-title>. <source>J.&#x20;Materiomics</source> <volume>3</volume>, <fpage>159</fpage>&#x2013;<lpage>177</lpage>. <pub-id pub-id-type="doi">10.1016/j.jmat.2017.08.002</pub-id> </citation>
</ref>
<ref id="B37">
<citation citation-type="book">
<collab>LiveDesign</collab> (<year>2021</year>). <source>LiveDesign Release 8.11</source>. <publisher-loc>New York, NY</publisher-loc>: <publisher-name>Schrodinger, LLC</publisher-name>. </citation>
</ref>
<ref id="B38">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>March</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>1985</year>). <source>Advanced Organic Chemistry</source>. <edition>3rd Ed</edition>. <publisher-loc>New York</publisher-loc>: <publisher-name>John Wiley &#x26; Sons</publisher-name>. </citation>
</ref>
<ref id="B39">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Marques</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Leswing</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Robertson</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Giesen</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Halls</surname>
<given-names>M. D.</given-names>
</name>
<name>
<surname>Goldberg</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>De Novo Design of Molecules with Low Hole Reorganization Energy Based on a Quarter-Million Molecule DFT Screen</article-title>. <source>J.&#x20;Phys. Chem. A.</source> <volume>125</volume>, <fpage>7331</fpage>&#x2013;<lpage>7343</lpage>. <pub-id pub-id-type="doi">10.1021/acs.jpca.1c04587</pub-id> </citation>
</ref>
<ref id="B40">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Matsuzawa</surname>
<given-names>N. N.</given-names>
</name>
<name>
<surname>Arai</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Sasago</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Fujii</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Goldberg</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Mustard</surname>
<given-names>T. J.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Massive Theoretical Screen of Hole Conducting Organic Materials in the Heteroacene Family by Using a Cloud-Computing Environment</article-title>. <source>J.&#x20;Phys. Chem. A.</source> <volume>124</volume> (<issue>10</issue>), <fpage>1981</fpage>&#x2013;<lpage>1992</lpage>. <pub-id pub-id-type="doi">10.1021/acs.jpca.9b10998</pub-id> </citation>
</ref>
<ref id="B41">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Matsuzawa</surname>
<given-names>N. N.</given-names>
</name>
<name>
<surname>Arai</surname>
<given-names>H.</given-names>
</name>
<name>
<surname>Sasago</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Fujii</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Goldberg</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Mustard</surname>
<given-names>T. J.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Massive Theoretical Screen of Hole Conducting Organic Materials in the Heteroacene Family by Using a Cloud-Computing Environment</article-title>. <source>J.&#x20;Phys. Chem. A.</source> <volume>124</volume>, <fpage>1981</fpage>&#x2013;<lpage>1992</lpage>. <pub-id pub-id-type="doi">10.1021/acs.jpca.9b10998</pub-id> </citation>
</ref>
<ref id="B42">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Melnyk</surname>
<given-names>A. R.</given-names>
</name>
<name>
<surname>Pai</surname>
<given-names>D. M.</given-names>
</name>
</person-group> (<year>1990</year>). <article-title>Photoconductors in Electrophotography</article-title>. <source>Proc. SPIE</source>, <fpage>1253</fpage>. </citation>
</ref>
<ref id="B43">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Meredig</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Agrawal</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Kirklin</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Saal</surname>
<given-names>J.&#x20;E.</given-names>
</name>
<name>
<surname>Doak</surname>
<given-names>J.&#x20;W.</given-names>
</name>
<name>
<surname>Thompson</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2014</year>). <article-title>Combinatorial Screening for New Materials in Unconstrained Composition Space with Machine Learning</article-title>. <source>Phys. Rev. B</source> <volume>89</volume>, <fpage>094104</fpage>. <pub-id pub-id-type="doi">10.1103/physrevb.89.094104</pub-id> </citation>
</ref>
<ref id="B44">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Merk</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Friedrich</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Grisoni</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Schneider</surname>
<given-names>G.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>De Novo Design of Bioactive Small Molecules by Artificial Intelligence</article-title>. <source>Mol. Inf.</source> <volume>37</volume>, <fpage>1700153</fpage>. <pub-id pub-id-type="doi">10.1002/minf.201700153</pub-id> </citation>
</ref>
<ref id="B45">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Moosavi</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Jablonka</surname>
<given-names>K. M.</given-names>
</name>
<name>
<surname>Smit</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>The Role of Machine Learning in the Understanding and Design of Materials</article-title>. <source>J.&#x20;Am. Chem. Soc.</source> <volume>142</volume>, <fpage>20273</fpage>&#x2013;<lpage>20287</lpage>. <pub-id pub-id-type="doi">10.1021/jacs.0c09105</pub-id> </citation>
</ref>
<ref id="B46">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Murahari</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Mahajan</surname>
<given-names>V.</given-names>
</name>
<name>
<surname>Neeladri</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Kumar</surname>
<given-names>M. S.</given-names>
</name>
<name>
<surname>Mayur</surname>
<given-names>Y. C.</given-names>
</name>
</person-group> (<year>2019</year>). <article-title>Ligand Based Design and Synthesis of Pyrazole Based Derivatives as Selective COX-2 Inhibitors</article-title>. <source>Bioorg. Chem.</source> <volume>86</volume>, <fpage>583</fpage>&#x2013;<lpage>597</lpage>. <pub-id pub-id-type="doi">10.1016/j.bioorg.2019.02.031</pub-id> </citation>
</ref>
<ref id="B47">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Murdock</surname>
<given-names>S. E.</given-names>
</name>
<name>
<surname>Hughes</surname>
<given-names>T. F.</given-names>
</name>
<name>
<surname>Kwak</surname>
<given-names>S. H.</given-names>
</name>
<name>
<surname>Goldberg</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Giesen</surname>
<given-names>D. J.</given-names>
</name>
<name>
<surname>Cao</surname>
<given-names>Y.</given-names>
</name>
<etal/>
</person-group> (<year>2015</year>). <article-title>Discovery of New Anode SEI Forming Additives Using an In Silico Evolutionary Approach</article-title>. <source>ECS Trans.</source> <volume>69</volume>, <fpage>67</fpage>&#x2013;<lpage>74</lpage>. <pub-id pub-id-type="doi">10.1149/06901.0067ecst</pub-id> </citation>
</ref>
<ref id="B48">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Naito</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Miura</surname>
<given-names>A.</given-names>
</name>
</person-group> (<year>1993</year>). <article-title>Molecular Design for Nonpolymeric Organic Dye Glasses with thermal Stability: Relations between Thermodynamic Parameters and Amorphous Properties</article-title>. <source>J.&#x20;Phys. Chem.</source> <volume>97</volume>, <fpage>6240</fpage>&#x2013;<lpage>6248</lpage>. <pub-id pub-id-type="doi">10.1021/j100125a025</pub-id> </citation>
</ref>
<ref id="B49">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nisbet</surname>
<given-names>M. L.</given-names>
</name>
<name>
<surname>Pendleton</surname>
<given-names>I. M.</given-names>
</name>
<name>
<surname>Nolis</surname>
<given-names>G. M.</given-names>
</name>
<name>
<surname>Griffith</surname>
<given-names>K. J.</given-names>
</name>
<name>
<surname>Schrier</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Cabana</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Machine-Learning-Assisted Synthesis of Polar Racemates</article-title>. <source>J.&#x20;Am. Chem. Soc.</source> <volume>142</volume>, <fpage>7555</fpage>&#x2013;<lpage>7566</lpage>. <pub-id pub-id-type="doi">10.1021/jacs.0c01239</pub-id> </citation>
</ref>
<ref id="B50">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Olivecrona</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Blaschke</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Engkvist</surname>
<given-names>O.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2017</year>). <article-title>Molecular De-novo Design through Deep Reinforcement Learning</article-title>. <source>J.&#x20;Cheminform.</source> <volume>9</volume>, <fpage>48</fpage>. <pub-id pub-id-type="doi">10.1186/s13321-017-0235-x</pub-id> </citation>
</ref>
<ref id="B51">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Pilania</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Jiang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Rajasekaran</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Ramprasad</surname>
<given-names>R.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Accelerating Materials Property Predictions Using Machine Learning</article-title>. <source>Sci. Rep.</source> <volume>3</volume>, <fpage>2810</fpage>. <pub-id pub-id-type="doi">10.1038/srep02810</pub-id> </citation>
</ref>
<ref id="B52">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Raccuglia</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Elbert</surname>
<given-names>K. C.</given-names>
</name>
<name>
<surname>Adler</surname>
<given-names>P. D. F.</given-names>
</name>
<name>
<surname>Falk</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Wenny</surname>
<given-names>M. B.</given-names>
</name>
<name>
<surname>Mollo</surname>
<given-names>A.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Machine-learning-assisted Materials Discovery Using Failed Experiments</article-title>. <source>Nature</source> <volume>533</volume>, <fpage>73</fpage>&#x2013;<lpage>76</lpage>. <pub-id pub-id-type="doi">10.1038/nature17439</pub-id> </citation>
</ref>
<ref id="B53">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rogers</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Hahn</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Extended-Connectivity Fingerprints</article-title>. <source>J.&#x20;Chem. Inf. Model.</source> <volume>50</volume>, <fpage>742</fpage>&#x2013;<lpage>754</lpage>. <pub-id pub-id-type="doi">10.1021/ci100050t</pub-id> </citation>
</ref>
<ref id="B54">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Schmidbauer</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Hohenleutner</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>K&#xf6;nig</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2013</year>). <article-title>Chemical Degradation in Organic Light-Emitting Devices: Mechanisms and Implications for the Design of New Materials</article-title>. <source>Adv. Mater.</source> <volume>25</volume>, <fpage>2114</fpage>&#x2013;<lpage>2129</lpage>. <pub-id pub-id-type="doi">10.1002/adma.201205022</pub-id> </citation>
</ref>
<ref id="B55">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Schneider</surname>
<given-names>G.</given-names>
</name>
<name>
<surname>Fechner</surname>
<given-names>U.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Computer-based De Novo Design of Drug-like Molecules</article-title>. <source>Nat. Rev. Drug Discov.</source> <volume>4</volume>, <fpage>649</fpage>&#x2013;<lpage>663</lpage>. <pub-id pub-id-type="doi">10.1038/nrd1799</pub-id> </citation>
</ref>
<ref id="B56">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Schneider</surname>
<given-names>N.</given-names>
</name>
<name>
<surname>Lowe</surname>
<given-names>D. M.</given-names>
</name>
<name>
<surname>Sayle</surname>
<given-names>R. A.</given-names>
</name>
<name>
<surname>Tarselli</surname>
<given-names>M. A.</given-names>
</name>
<name>
<surname>Landrum</surname>
<given-names>G. A.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Big Data from Pharmaceutical Patents: A Computational Analysis of Medicinal Chemists&#x27; Bread and Butter</article-title>. <source>J.&#x20;Med. Chem.</source> <volume>59</volume> (<issue>9</issue>), <fpage>4385</fpage>&#x2013;<lpage>4402</lpage>. <pub-id pub-id-type="doi">10.1021/acs.jmedchem.6b00153</pub-id> </citation>
</ref>
<ref id="B57">
<citation citation-type="book">
<collab>Schr&#xf6;dinger</collab> (<year>2021</year>). <source>Schr&#xf6;dinger Release 2021-2: Materials Science Suite</source>. <publisher-loc>New York, NY</publisher-loc>: <publisher-name>Schr&#xf6;dinger, LLC</publisher-name>. </citation>
</ref>
<ref id="B58">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Segler</surname>
<given-names>M. H. S.</given-names>
</name>
<name>
<surname>Kogej</surname>
<given-names>T.</given-names>
</name>
<name>
<surname>Tyrchan</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Waller</surname>
<given-names>M. P.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>Generating Focused Molecule Libraries for Drug Discovery with Recurrent Neural Networks</article-title>. <source>ACS Cent. Sci.</source> <volume>4</volume> (<issue>1</issue>), <fpage>120</fpage>&#x2013;<lpage>131</lpage>. <pub-id pub-id-type="doi">10.1021/acscentsci.7b00512</pub-id> </citation>
</ref>
<ref id="B59">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shahnawaz</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Sudheendran Swayamprabha</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Nagar</surname>
<given-names>M. R.</given-names>
</name>
<name>
<surname>Yadav</surname>
<given-names>R. A. K.</given-names>
</name>
<name>
<surname>Gull</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Dubey</surname>
<given-names>D. K.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Hole-transporting Materials for Organic Light-Emitting Diodes: an Overview</article-title>. <source>J.&#x20;Mater. Chem. C.</source> <volume>7</volume>, <fpage>7144</fpage>&#x2013;<lpage>7158</lpage>. <pub-id pub-id-type="doi">10.1039/c9tc01712g</pub-id> </citation>
</ref>
<ref id="B60">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shalf</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>The Future of Computing beyond Moore&#x27;s Law</article-title>. <source>Phil. Trans. R. Soc. A.</source> <volume>378</volume>, <fpage>20190061</fpage>. <pub-id pub-id-type="doi">10.1098/rsta.2019.0061</pub-id> </citation>
</ref>
<ref id="B61">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shi</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>J.-Y.</given-names>
</name>
<name>
<surname>Pei</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2015</year>). <article-title>&#x3c0;-Conjugated Aromatics Based on Truxene: Synthesis, Self-Assembly, and Applications</article-title>. <source>Chem. Rec.</source> <volume>15</volume>, <fpage>52</fpage>&#x2013;<lpage>72</lpage>. <pub-id pub-id-type="doi">10.1002/tcr.201402071</pub-id> </citation>
</ref>
<ref id="B62">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shirota</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Kageyama</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2007</year>). <article-title>Charge Carrier Transporting Molecular Materials and Their Applications in Devices</article-title>. <source>Chem. Rev.</source> <volume>107</volume>, <fpage>953</fpage>&#x2013;<lpage>1010</lpage>. <pub-id pub-id-type="doi">10.1021/cr050143&#x2b;</pub-id> </citation>
</ref>
<ref id="B63">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shirota</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2000</year>). <article-title>Organic Materials for Electronic and Optoelectronic Devices</article-title>. <source>J.&#x20;Mater. Chem.</source> <volume>10</volume>, <fpage>1</fpage>&#x2013;<lpage>25</lpage>. <pub-id pub-id-type="doi">10.1039/a908130e</pub-id> </citation>
</ref>
<ref id="B64">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shukla</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Welter</surname>
<given-names>T. R.</given-names>
</name>
<name>
<surname>Robello</surname>
<given-names>D. R.</given-names>
</name>
<name>
<surname>Giesen</surname>
<given-names>D. J.</given-names>
</name>
<name>
<surname>Lenhard</surname>
<given-names>J.&#x20;R.</given-names>
</name>
<name>
<surname>Ahearn</surname>
<given-names>W. G.</given-names>
</name>
<etal/>
</person-group> (<year>2009</year>). <article-title>Dioxapyrene-Based Organic Semiconductors for Organic Field Effect Transistors</article-title>. <source>J.&#x20;Phys. Chem. C.</source> <volume>113</volume>, <fpage>14482</fpage>&#x2013;<lpage>14486</lpage>. <pub-id pub-id-type="doi">10.1021/jp903472q</pub-id> </citation>
</ref>
<ref id="B65">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>So</surname>
<given-names>F.</given-names>
</name>
<name>
<surname>Kondakov</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2010</year>). <article-title>Degradation Mechanisms in Small-Molecule and Polymer Organic Light-Emitting Diodes</article-title>. <source>Adv. Mater.</source> <volume>22</volume>, <fpage>3762</fpage>&#x2013;<lpage>3777</lpage>. <pub-id pub-id-type="doi">10.1002/adma.200902624</pub-id> </citation>
</ref>
<ref id="B66">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>St. John</surname>
<given-names>P. C.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Paton</surname>
<given-names>R. S.</given-names>
</name>
<name>
<surname>Paton</surname>
<given-names>R. S.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>Prediction of Organic Homolytic Bond Dissociation Enthalpies at Near Chemical Accuracy with Sub-second Computational Cost</article-title>. <source>Nat. Commun.</source> <volume>11</volume>, <fpage>2328</fpage>. <pub-id pub-id-type="doi">10.1038/s41467-020-16201-z</pub-id> </citation>
</ref>
<ref id="B67">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Truhlar</surname>
<given-names>D. G.</given-names>
</name>
<name>
<surname>Cramer</surname>
<given-names>C. J.</given-names>
</name>
<name>
<surname>Lewis</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Bumpus</surname>
<given-names>J.&#x20;A.</given-names>
</name>
</person-group> (<year>2004</year>). <article-title>Molecular Modeling of Environmentally Important Processes: Reduction Potentials</article-title>. <source>J.&#x20;Chem. Educ.</source> <volume>81</volume>, <fpage>596</fpage>. <pub-id pub-id-type="doi">10.1021/ed081p596</pub-id> </citation>
</ref>
<ref id="B68">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Vor&#x161;il&#xe1;k</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Kolar</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Cmelo</surname>
<given-names>I.</given-names>
</name>
<name>
<surname>Svozil</surname>
<given-names>D.</given-names>
</name>
</person-group> (<year>2020</year>). <article-title>SYBA: Bayesian Estimation of Synthetic Accessibility of Organic Compounds</article-title>. <source>J.&#x20;Cheminform.</source> <volume>12</volume>, <fpage>35</fpage>. <pub-id pub-id-type="doi">10.1186/s13321-020-00439-2</pub-id> </citation>
</ref>
<ref id="B69">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Wei</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Chu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>X. Y.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>K.</given-names>
</name>
<name>
<surname>Deng</surname>
<given-names>H. X.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2019</year>). <article-title>Machine Learning in Materials Science</article-title>. <source>InfoMat</source> <volume>1</volume>, <fpage>338</fpage>&#x2013;<lpage>358</lpage>. <pub-id pub-id-type="doi">10.1002/inf2.12028</pub-id> </citation>
</ref>
<ref id="B70">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xie</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Hu</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Kelley</surname>
<given-names>S. P.</given-names>
</name>
<name>
<surname>Atwood</surname>
<given-names>J.&#x20;L.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Machine Learning Assisted Synthesis of Metal-Organic Nanocapsules</article-title>. <source>J.&#x20;Am. Chem. Soc.</source> <volume>142</volume>, <fpage>1475</fpage>&#x2013;<lpage>1481</lpage>. <pub-id pub-id-type="doi">10.1021/jacs.9b11569</pub-id> </citation>
</ref>
<ref id="B71">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2005</year>). <article-title>Prediction of Glass Transition Temperatures of OLED Materials Using Topological Indices</article-title>. <source>J.&#x20;Mol. Model.</source> <volume>12</volume>, <fpage>24</fpage>&#x2013;<lpage>33</lpage>. <pub-id pub-id-type="doi">10.1007/s00894-005-0282-5</pub-id> </citation>
</ref>
<ref id="B72">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>He</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Xue</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Guo</surname>
<given-names>Q.</given-names>
</name>
<name>
<surname>Xia</surname>
<given-names>H.</given-names>
</name>
<etal/>
</person-group> (<year>2009</year>). <article-title>Solution-processable and thermal-stable Triphenylamine-Based Dendrimers with Truxene Cores as Hole-Transporting Materials for Organic Light-Emitting Devices</article-title>. <source>Org. Electro.</source> <volume>10</volume>, <fpage>954</fpage>&#x2013;<lpage>959</lpage>. <pub-id pub-id-type="doi">10.1016/j.orgel.2009.04.024</pub-id> </citation>
</ref>
<ref id="B73">
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Yarnell</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Lemonick</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Mullin</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Patel</surname>
<given-names>P.</given-names>
</name>
</person-group> (<year>2021</year>). <source>ACS Discovery Report, Q2</source>. </citation>
</ref>
<ref id="B74">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Yin</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Shuai</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
</person-group> (<year>2003</year>). <article-title>A Quantitative Structure&#x2212;Property Relationship Study of the Glass Transition Temperature of OLED Materials</article-title>. <source>J.&#x20;Chem. Inf. Comput. Sci.</source> <volume>43</volume>, <fpage>970</fpage>&#x2013;<lpage>977</lpage>. <pub-id pub-id-type="doi">10.1021/ci034011y</pub-id> </citation>
</ref>
</ref-list>
</back>
</article>