<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Toxicol.</journal-id>
<journal-title>Frontiers in Toxicology</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Toxicol.</abbrev-journal-title>
<issn pub-type="epub">2673-3080</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1437884</article-id>
<article-id pub-id-type="doi">10.3389/ftox.2024.1437884</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Toxicology</subject>
<subj-group>
<subject>Technology and Code</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Transforming environmental health datasets from the comparative toxicogenomics database into chord diagrams to visualize molecular mechanisms</article-title>
<alt-title alt-title-type="left-running-head">Wyatt et al.</alt-title>
<alt-title alt-title-type="right-running-head">
<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.3389/ftox.2024.1437884">10.3389/ftox.2024.1437884</ext-link>
</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Wyatt</surname>
<given-names>Brent</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1261680/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/methodology/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Davis</surname>
<given-names>Allan Peter</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1900367/overview"/>
<role content-type="https://credit.niso.org/contributor-roles/conceptualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/investigation/"/>
<role content-type="https://credit.niso.org/contributor-roles/supervision/"/>
<role content-type="https://credit.niso.org/contributor-roles/validation/"/>
<role content-type="https://credit.niso.org/contributor-roles/visualization/"/>
<role content-type="https://credit.niso.org/contributor-roles/writing-original-draft/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wiegers</surname>
<given-names>Thomas C.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Wiegers</surname>
<given-names>Jolene</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Abrar</surname>
<given-names>Sakib</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/software/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Sciaky</surname>
<given-names>Daniela</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Barkalow</surname>
<given-names>Fern</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Strong</surname>
<given-names>Melissa</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/data-curation/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Mattingly</surname>
<given-names>Carolyn J.</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<role content-type="https://credit.niso.org/contributor-roles/funding-acquisition/"/>
<role content-type="https://credit.niso.org/contributor-roles/project-administration/"/>
<role content-type="https://credit.niso.org/contributor-roles/Writing - review &#x26; editing/"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>Department of Biological Sciences</institution>, <institution>North Carolina State University</institution>, <addr-line>Raleigh</addr-line>, <addr-line>NC</addr-line>, <country>United States</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Center for Human Health and the Environment</institution>, <institution>North Carolina State University</institution>, <addr-line>Raleigh</addr-line>, <addr-line>NC</addr-line>, <country>United States</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/691669/overview">Agnes Karmaus</ext-link>, Integrated Laboratory Systems, Inc., United States</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/284335/overview">Jui-Hua Hsieh</ext-link>, National Institute of Environmental Health Sciences (NIH), United States</p>
<p>
<ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/2756329/overview">Kimberly T. To</ext-link>, Integrated Laboratory Systems, Inc., United States</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Allan Peter Davis, <email>apdavis3@ncsu.edu</email>
</corresp>
</author-notes>
<pub-date pub-type="epub">
<day>22</day>
<month>07</month>
<year>2024</year>
</pub-date>
<pub-date pub-type="collection">
<year>2024</year>
</pub-date>
<volume>6</volume>
<elocation-id>1437884</elocation-id>
<history>
<date date-type="received">
<day>24</day>
<month>05</month>
<year>2024</year>
</date>
<date date-type="accepted">
<day>26</day>
<month>06</month>
<year>2024</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2024 Wyatt, Davis, Wiegers, Wiegers, Abrar, Sciaky, Barkalow, Strong and Mattingly.</copyright-statement>
<copyright-year>2024</copyright-year>
<copyright-holder>Wyatt, Davis, Wiegers, Wiegers, Abrar, Sciaky, Barkalow, Strong and Mattingly</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p>
</license>
</permissions>
<abstract>
<p>In environmental health, the specific molecular mechanisms connecting a chemical exposure to an adverse endpoint are often unknown, reflecting knowledge gaps. At the public Comparative Toxicogenomics Database (CTD; <ext-link ext-link-type="uri" xlink:href="https://ctdbase.org/">https://ctdbase.org/</ext-link>), we integrate manually curated, literature-based interactions from CTD to compute four-unit blocks of information organized as a potential step-wise molecular mechanism, known as &#x201c;CGPD-tetramers,&#x201d; wherein a chemical interacts with a gene product to trigger a phenotype which can be linked to a disease. These computationally derived datasets can be used to fill the gaps and offer testable mechanistic information. Users can generate CGPD-tetramers for any combination of chemical, gene, phenotype, and/or disease of interest at CTD; however, such queries typically result in the generation of thousands of CGPD-tetramers. Here, we describe a novel approach to transform these large datasets into user-friendly chord diagrams using R. This visualization process is straightforward, simple to implement, and accessible to inexperienced users that have never used R before. Combining CGPD-tetramers into a single chord diagram helps identify potential key chemicals, genes, phenotypes, and diseases. This visualization allows users to more readily analyze computational datasets that can fill the exposure knowledge gaps in the environmental health continuum.</p>
</abstract>
<kwd-group>
<kwd>data visualization</kwd>
<kwd>chord diagram</kwd>
<kwd>r</kwd>
<kwd>molecular mechanisms</kwd>
<kwd>environmental health</kwd>
<kwd>database</kwd>
<kwd>tetramers</kwd>
</kwd-group>
<custom-meta-wrap>
<custom-meta>
<meta-name>section-at-acceptance</meta-name>
<meta-value>Computational Toxicology and Informatics</meta-value>
</custom-meta>
</custom-meta-wrap>
</article-meta>
</front>
<body>
<sec id="s1">
<title>1 Introduction</title>
<p>Chemicals are important environmental factors that can affect human health, yet the molecular mechanisms connecting an exposure to an adverse outcome often remain unknown, reflecting knowledge and information gaps in the continuum (<xref ref-type="bibr" rid="B20">Thessen et al., 2020</xref>). The Comparative Toxicogenomics Database (CTD; <ext-link ext-link-type="uri" xlink:href="https://ctdbase.org">https://ctdbase.org</ext-link>) is an innovative public resource that provides manually curated information from the scientific literature to harmonize and centralize cross-species data for chemical exposures and their interactions with genes, phenotypes (non-disease biological processes), and diseases (<xref ref-type="bibr" rid="B6">Davis et al., 2023a</xref>). Currently, CTD includes 3.5 million manually curated interactions relating 17,600 chemicals, 55,000 genes, 6,600 phenotypes, and 7,300 diseases. Additionally, CTD leverages data integration strategies to compute potential molecular mechanistic solutions that help fill knowledge gaps between exposure and adverse outcomes; presently, CTD generates over 88 million toxicogenomic relationships for users to explore (<ext-link ext-link-type="uri" xlink:href="https://ctdbase.org/about/dataStatus.go">https://ctdbase.org/about/dataStatus.go</ext-link>). CTD datasets have been used to analyze diverse environmental health issues, including ozone-induced myocardial infarction (<xref ref-type="bibr" rid="B5">Davis et al., 2020</xref>), arsenic-linked male reproductive defects (<xref ref-type="bibr" rid="B2">Chai et al., 2021</xref>), heavy metal-associated depression (<xref ref-type="bibr" rid="B16">Nguyen and Kim, 2023</xref>), fatty liver disease resulting from perfluorooctane sulfonate (<xref ref-type="bibr" rid="B14">Kim et al., 2023</xref>), chemical-induced pulmonary fibrosis (<xref ref-type="bibr" rid="B13">Jeong et al., 2023</xref>), and hepatic toxicity from bisphenol exposure (<xref ref-type="bibr" rid="B21">Zhao et al., 2024</xref>).</p>
<p>Through data integration and novel analytical approaches, CTD has the capacity to provide insights into complex mechanistic relationships between chemical exposures and adverse outcomes by generating &#x201c;CGPD-tetramers&#x201d;: four-unit computational blocks of information that link an initiating Chemical with a Gene to modulate a Phenotype that can be inferred to a Disease outcome (<xref ref-type="bibr" rid="B5">Davis et al., 2020</xref>). To compute a tetramer, five independently, manually curated relationships in CTD are integrated, including a chemical-gene interaction, a chemical-phenotype interaction, a chemical-disease interaction, a gene-disease interaction, and a gene-phenotype annotation (<xref ref-type="fig" rid="F1">Figure 1A</xref>). A new analytical tool called &#x201c;CTD Tetramers&#x201d; (<xref ref-type="bibr" rid="B8">Davis et al., 2023b</xref>) allows users to generate CGPD-tetramers for any chemical, gene, phenotype, or disease of interest (<xref ref-type="fig" rid="F1">Figure 1B</xref>). However, most queries typically return hundreds or thousands of tetramers, displayed as a web-based table, wherein the content can be sorted or downloaded.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>
<bold>(A)</bold> A CGPD-tetramer is computationally generated by data integration only if five independently curated interactions (1&#x2013;5) currently exist in CTD, interrelating a chemical (C), gene (G), phenotype (P), and disease (D). <bold>(B)</bold> A new analytical tool called &#x201c;CTD Tetramers&#x201d; (<ext-link ext-link-type="uri" xlink:href="https://ctdbase.org/query.go?type=tetramer">https://ctdbase.org/query.go?type&#x3d;tetramer</ext-link>) enables users to generate their own tetramers by providing one or more chemical, gene, phenotype, or disease terms of interest. Here, &#x201c;chromium&#x201d; is entered as the chemical of interest, and CTD computationally generates 832 unique tetramers for this environmental metal with its associated gene, phenotype, and disease components. The query results are displayed as a sortable web-page table and can be downloaded as a file in different formats, including CSV.</p>
</caption>
<graphic xlink:href="ftox-06-1437884-g001.tif"/>
</fig>
<p>To extend the analysis of these large CTD Tetramer query results, we describe a novel method to transform CGPD-tetramers into a chord diagram that allows patterns and relationships to be more easily recognized. The diagram links information in a circular layout by listing the data types as nodes around the circumference of the circle and using arcs to depict the connecting relationships among the nodes. Each time a relationship is plotted, the corresponding node gets larger, and as nodes and arcs grow in length and width, it becomes visually apparent which components occur most frequently (<xref ref-type="fig" rid="F2">Figure 2</xref>). This approach allows all the CGPD-tetramers from a table to be combined and visualized in a single graph, facilitating the identification of potentially key mechanistic elements connecting a chemical exposure to a disease endpoint.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>A schematic of how multiple CGPD-tetramers are converted into a single chord diagram. Here, for simplicity, only three tetramers are used, involving one chemical, two genes, two phenotypes, and one disease that are displayed as a web-table, and can be downloaded as a file in CSV format. Using R, individual dimer relationships between unique chemicals (C), genes (G), phenotypes (P), and diseases (D) in the tetramer set are first formatted; then, the number of unique dimer frequencies are counted and this value is used to scale the corresponding length of the node and width of the connecting arcs for each data type. Chord diagrams offer a more pleasing visual representation of the same data seen in a table, but enables key elements to be more easily recognized due to the scaled length and width of the nodes and arcs, respectively. Diagrams are read in a clockwise direction, in the same order that a CGPD-tetramer is read: here, the initiating chemical (Ozone) interacts with two genes (PTGFR and TFPI), which in turn modulate two phenotypes (inflammatory response and response to lipopolysaccharide), ending in the disease airway obstruction. The scaled dimensions of the nodes and arcs reflect the frequency of the terms in the total tetramer set, allowing potential key mechanisms to be more easily identified (here, ozone, PTGFR, and response to lipopolysaccharides are overrepresented in this simplistic illustration). The four data types are color-coded to facilitate demarcation in the diagram, using a blue palette (for chemicals), green palette (for genes), purple palette (for phenotypes), and red palette (for diseases).</p>
</caption>
<graphic xlink:href="ftox-06-1437884-g002.tif"/>
</fig>
<p>The chord diagrams are compact, elegant representations of complex tetramer datasets. To generate these diagrams, we make use of R, a widely used and publicly available programming environment that can be run on all major operating systems, including Windows, MacOS, and Linux. The R-based script and instructions that we provide are easy to learn, so that even novice users can quickly begin creating chord diagrams illuminating CTD tetramer results.</p>
</sec>
<sec sec-type="methods" id="s2">
<title>2 Methods</title>
<sec id="s2-1">
<title>2.1 CTD data version and analysis</title>
<p>Analysis was performed using CTD public data available (revision 17,266; March 2024). CTD is updated with new content on a monthly basis (<ext-link ext-link-type="uri" xlink:href="https://ctdbase.org/about/dataStatus.go">https://ctdbase.org/about/dataStatus.go</ext-link>); consequently, query results described in this text may vary over time.</p>
</sec>
<sec id="s2-2">
<title>2.2 R environment</title>
<p>The freely available version 4.4.0 of R (<ext-link ext-link-type="uri" xlink:href="https://www.r-project.org">https://www.r-project.org</ext-link>) was used (<xref ref-type="bibr" rid="B17">R Core Team, 2018</xref>). The R package data.table version 1.15.2 (<ext-link ext-link-type="uri" xlink:href="https://cran.r-project.org/package=data.table">https://CRAN.R-project.org/package&#x3d;data.table</ext-link>) was used in preparing the data and the R package circlize version 0.4.16 (<ext-link ext-link-type="uri" xlink:href="https://cran.r-project.org/package=circlize">https://CRAN.R-project.org/package&#x3d;circlize</ext-link>) was used to generate the chord diagrams (<xref ref-type="bibr" rid="B10">Gu et al., 2014</xref>). To format CGPD-tetramers and plot a basic chord diagram, download the <italic>CTD-vizscript.R</italic>, from GitHub (<ext-link ext-link-type="uri" xlink:href="https://github.com/CTD-NCSU/Chord_Diagrams">https://github.com/CTD-NCSU/Chord_Diagrams</ext-link>) or use the version included with a dataset of test tetramers (&#x201c;test.csv&#x201d;) for practice (<xref ref-type="sec" rid="s10">Supplemental File S1</xref>). For CTD users unfamiliar with R, it is not necessary to download local versions of the software to generate the chord diagrams. Instead, a free, web-based version of R and RStudio environment from Posit Cloud (<ext-link ext-link-type="uri" xlink:href="https://posit.cloud">https://posit.cloud</ext-link>) may be used to generate the diagrams; users will need to first create a free account at Posit Cloud, and the steps required using the latter method are provided below.</p>
</sec>
<sec id="s2-3">
<title>2.3 Basic steps for CTD tetramer visualization using web-based Posit Cloud</title>
<p>Step 1: Download CTD Tetramers query results in CSV format (and rename the file to something more intuitive); start with a dataset of no more than 1,500 tetramers (discussed below); alternatively, use the test sample CSV file provided as &#x201c;test.csv&#x201d; (<xref ref-type="sec" rid="s10">Supplemental File S1</xref>), which contains 309 CGPD-tetramers composed of two chemicals (copper and iron), 61 genes, 87 phenotypes, and 1 disease (liver neoplasms).</p>
<p>Step 2: Download <italic>CTD-vizscript.R</italic> locally from GitHub (<ext-link ext-link-type="uri" xlink:href="https://github.com/CTD-NCSU/Chord_Diagrams">https://github.com/CTD-NCSU/Chord_Diagrams</ext-link>) or use the provided file (<xref ref-type="sec" rid="s10">Supplemental File S1</xref>)</p>
<p>Step 3: Create a free account at Posit Cloud (<ext-link ext-link-type="uri" xlink:href="https://posit.cloud">https://posit.cloud</ext-link>) and log in to the &#x201c;Your Workspace&#x201d; web page.</p>
<p>Step 4: On the right-hand side of the workspace web page, click on the &#x201c;New Project&#x201d; button and select &#x201c;New RStudio Project&#x201d; from the drop-down menu. The browser will reload showing three panes: &#x201c;Console&#x201d; in the upper left, &#x201c;Environment&#x201d; in the upper right, and &#x201c;Files&#x201d; in the bottom right; browser screenshots for the subsequent steps are provided (<xref ref-type="sec" rid="s10">Supplemental File S2</xref>). In the bottom right pane (&#x201c;Files&#x201d;), click on the &#x201c;Upload&#x201d; button to browse for and select the downloaded copy of <italic>CTD-vizscript.R</italic> file (panel A, <xref ref-type="sec" rid="s10">Supplemental File S2</xref>); then upload the CSV formatted file of the CTD Tetramer query results that are to be visualized, or use the provided sample file <italic>&#x201c;</italic>test.csv.<italic>&#x201d;</italic> Both files will now be listed in the &#x201c;Files&#x201d; pane.</p>
<p>Step 5: Click on the <italic>CTD-vizscript.R</italic> file and the script will appear in a new upper left-hand pane (and &#x201c;Console&#x201d; will displace to the bottom left). An alert will pop up and ask to install circlize and data.table. Choose install (panel C, <xref ref-type="sec" rid="s10">Supplemental File S2</xref>). In the &#x201c;Console&#x201d; window, you&#x2019;ll see the program run until it is finished.</p>
<p>Step 6: Load data.table and circlize using the library() command to make them available for future steps. To do this, go to code lines 2&#x2013;3 and execute the two lines of the script by using the cursor to physically highlight the two lines for library(data.table) and library(circlize) in the window pane, and then click &#x201c;Run&#x201d; button (panel D, <xref ref-type="sec" rid="s10">Supplemental File S2</xref>).</p>
<p>Step 7: Under &#x201c;&#x23;Import data,&#x201d; at code line 6 assign the name of the CTD Tetramer query result file to the variable &#x201c;tetramers&#x201d; (panel E, <xref ref-type="sec" rid="s10">Supplemental File S2</xref>). To do this, type in the exact name of the file, which is case-sensitive, surrounded by quotation marks, and suffixed with &#x201c;.csv,&#x201d; all enclosed with the parentheses. For example, if using the provided test file (test.csv), then set the line to read: tetramers &#x3c; - read.csv(&#x201c;test.csv&#x201d;). The case-sensitive file name must be spelled exactly, contain the CSV suffix, be flanked by quotation marks, and enclosed in the parentheses.</p>
<p>Step 8: Using the cursor, highlight the line from step 7 (where the tetramer file name is entered on code line 6) along with the rest of the script to code line 60 (panel F, <xref ref-type="sec" rid="s10">Supplemental File S2</xref>). Click the &#x201c;Run&#x201d; button.</p>
<p>Step 9: If everything runs successfully, the tool will generate a colored chord diagram in the lower right pane under &#x201c;Plots&#x201d; (panel I, <xref ref-type="sec" rid="s10">Supplemental File S2</xref>). This process can take a few minutes, depending upon the total number of CGPD-tetramers that are being graphed. See below for common errors that might arise. To adjust the font size of the labels, go to code line 59 and find &#x201c;cex &#x3d; &#x201d; near the end of the script under &#x201c;&#x23;&#x23; Add labels to diagram&#x201d; (panel H, <xref ref-type="sec" rid="s10">Supplemental File S2</xref>). &#x201c;cex&#x201d; stands for &#x201c;character expansion&#x201d; and is the parameter that changes the font size of the node labels. It has a default value of 1; to make the font size smaller, the parameter can be changed to a value between 0 and 1; for example, cex &#x3d; 0.5 will result in text that is 50% smaller than the default value. Changing the parameter to a value greater than 1 will result in larger text; for example, cex &#x3d; 1.5 will result in text that is 50% larger than the default value. The greater the number of tetramers being plotted, the smaller the value of cex should be in order for the labels to be clearly separated and not overlapping. Additionally, or alternatively, for very large sets of tetramers where the node labels are difficult to resolve, a user might instead prefer to display only the node accession identifiers, as discussed below. After changing the value of cex, go to code line 45 and highlight the text beginning with circos.clear along with the remaining script, and click &#x201c;Run&#x201d;. This is necessary to clear out the old data and rerun the program using the newly entered values.</p>
<p>Step 10: The chord diagram can be saved as either a PDF or an image by clicking the &#x201c;Export&#x201d; button under the &#x201c;Plots&#x201d; tab of the lower right-hand pane (panel I, <xref ref-type="sec" rid="s10">Supplemental File S2</xref>).</p>
</sec>
<sec id="s2-4">
<title>2.4 Fixing common errors that might be encountered</title>
<p>Common error 1: An error that states Error in setDT(cgpd): could not find function &#x201c;setDT&#x201d; indicates the data.table package is not loaded. Highlight the line that says library(data.table) near the top of the script (code line 2) and click &#x201c;Run.&#x201d; This will make the function &#x201c;setDT&#x201d; available.</p>
<p>Common error 2: An error that states any of the following are not found, &#x201c;circos.clear,&#x201d; &#x201c;circos.par,&#x201d; &#x201c;chordDiagram,&#x201d; or &#x201c;circos.track, indicates the circlize package is not loaded. Highlight code line 3 that says library(circlize) and click &#x201c;Run.&#x201d; This will make those functions available.</p>
<p>Common error 3: An error that states &#x201c;Maybe your &#x201c;gap.degree&#x201d; is too large so that there is no space to allocate sectors&#x201d; indicates that there is a very large number of tetramers. First, highlight the code line 45 that says circos.clear() and click &#x201c;Run.&#x201d; Next, go to code line 47 that says circos.par(gap.degree &#x3d; 1) and change gap.degree to a number less than 1 (panel G, <xref ref-type="sec" rid="s10">Supplemental File S2</xref>). This is a setting for the gaps between neighboring nodes. Larger values for gap.degree will create larger spacing between nodes and smaller values for gap.degree will create smaller spacing between nodes. Once gap.degree is changed to a smaller value, highlight the line along with the rest of the script and click &#x201c;Run.&#x201d; If the error occurs again, repeat the process of running circos.clear, changing gap.degree to an even smaller number and rerunning the script.</p>
</sec>
<sec id="s2-5">
<title>2.5 Customizing chord diagrams</title>
<p>To enhance the readability of large chord diagrams, it is sometimes preferable to shorten the node term label to an accession identifier (ID), as this further compacts the diagram by reducing the text. A label can be switched from &#x201c;node term&#x201d; to &#x201c;node ID&#x201d; easily by adding &#x201c;.ID&#x201d; as a suffix the end of the Chemical, Gene, Phenotype, or Disease variables (code lines 10&#x2013;13) in the section under &#x201c;&#x23; Prep data&#x201d; (panel J, <xref ref-type="sec" rid="s10">Supplemental File S2</xref>). Highlight the script beginning with this line along with the remaining script and click &#x201c;Run&#x201d;. Additional customization options can be found in the circlize documentation at <ext-link ext-link-type="uri" xlink:href="https://jokergoo.github.io/circlize_book/book/index.html">https://jokergoo.github.io/circlize_book/book/index.html</ext-link>.</p>
<p>The default selection of color palettes for CTD tetramer chord diagrams are blue (chemical), green (gene), purple (phenotype), and red (disease). If necessary, users can change these colors using code lines 37&#x2013;40 (panel K, <xref ref-type="sec" rid="s10">Supplemental File S2</xref>). Each line of script for each of the four variables contains two colors. The script will create a palette from the first color listed to the second color. To change the color, simply edit the name in the code line, making sure the new color name is in quotation marks and the two colors are separated by a comma. There are many R color cheat sheets that can be found with an internet search to aid in choosing colors, including those that are specifically designed for users with color-vision deficiencies (<xref ref-type="bibr" rid="B3">Dahl et al., 2022</xref>).</p>
<p>A summary of the entire CTD-vizscript code is provided with information boxes showing the exact code lines that users can edit to customize the chord diagram output (panel L, <xref ref-type="sec" rid="s10">Supplemental File S2</xref>).</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>3 Results</title>
<sec id="s3-1">
<title>3.1 Visualizing a single dataset of tetramers</title>
<p>To demonstrate how to transform a large dataset of CGPD-tetramers into a single chord diagram, we queried the CTD Tetramers tool (<ext-link ext-link-type="uri" xlink:href="https://ctdbase.org/query.go?type=tetramer">https://ctdbase.org/query.go?type&#x3d;tetramer</ext-link>) using &#x201c;metals&#x201d; as the chemical input, selecting the hierarchy filter to include any descendant terms, and &#x201c;liver neoplasms&#x201d; as the disease outcome. This yields 309 CGPD-tetramers, composed of two chemicals (copper and iron), 61 genes, and 87 phenotypes connected to liver neoplasms (<xref ref-type="fig" rid="F3">Figure 3</xref>). The web-based table result displays only the first 50 of the 309 CGPD-tetramers (but it can be set to display 500). The tabular output is downloaded from the webpage as a CSV file, and then following the step-by-step directions (see Methods), the CTD Tetramer results are processed to generate a chord diagram that depicts all 309 CGPD-tetramers in a single image (<xref ref-type="fig" rid="F3">Figure 3</xref>). Each chemical, gene, phenotype, and disease is represented as a colored node on the circumference of the circle, with chemicals shown in a blue palette, genes in a green palette, phenotypes in a purple palette, and diseases in a red palette. The arcs in the center of the circle connect the four nodes of each CGPD-tetramer, and are read in a clockwise manner: chemical (blue arc) to gene, gene (green arc) to phenotype, and phenotype (purple arc) to disease. The length of the node reflects the frequency that the specific data term occurs in the CGPD-tetramers and the width of the arc is proportional to the frequency that a dimer interaction occurs (<xref ref-type="fig" rid="F2">Figure 2</xref>). Larger nodes/arcs readily highlight the more commonly used data types, and visually indicate potentially important molecular players, such as the genes HMOX1, TP53, and TNF, and the phenotypes cell proliferation and cell cycle for metal-associated liver neoplasms (<xref ref-type="fig" rid="F3">Figure 3</xref>).</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>CTD Tetramer query results are returned as a web-page table, and the default display shows only the first 50 tetramers. Here, 309 tetramers relate two metals (copper and iron) with 61 genes and 87 phenotypes to the disease outcome of liver neoplasms. To survey all 309 tetramers on the web page, the user can scroll and click open additional web-pages or sort the pages by clicking on column headers. Our visualization method enhances this analysis by transforming and depicting all 309 CGPD-tetramers in a single chord diagram, allowing the user to more readily identify potentially key components of the dataset, due to the scaled dimensions of nodes/arcs in the graph, such as the indicated genes (TNF, TP53, and HMOX1) and phenotypes (cell proliferation and cell cycle). Nodes and their projecting arcs represent the directionality, are read clockwise, and are color-coded, initiating with chemicals (blue palette) to genes (green palette) to phenotypes (purple palette) and ending with diseases (red palette).</p>
</caption>
<graphic xlink:href="ftox-06-1437884-g003.tif"/>
</fig>
</sec>
<sec id="s3-2">
<title>3.2 Combining and visualizing multiple datasets of tetramers</title>
<p>Environmental health is a complex, multifactorial system wherein outcomes can be the result of chemical mixtures and of multiple, independent chemical exposures from different sources (<xref ref-type="bibr" rid="B8">Davis et al., 2023b</xref>). Thus, CTD users often query for and analyze different sets of CGPD-tetramers for different chemicals and then combine the data to look for overlaps between shared molecular mechanisms and diseases. To aid in such analysis, multiple tetramer query results can be combined into a single chord diagram. To merge query results, it is most straightforward to download the individual CSV files for each independent query, combine the files into a single CSV document (using Excel copy-and-paste), and then upload that single file as the data source for generating a chord diagram as described above.</p>
<p>For example, numerous environmental factors have been associated with male infertility, including phthalates, pesticides, and arsenic (<xref ref-type="bibr" rid="B18">Rodprasert et al., 2023</xref>). Three independent queries for CTD tetramers that relate the chemicals dibutyl phthalate, atrazine, and arsenic to male infertility can be combined into a single chord diagram to help identify potentially key genetic and phenotypic molecular mechanisms associated with these environmental stressors (<xref ref-type="fig" rid="F4">Figure 4</xref>). In total, these three independent queries yield 381 CGPD-tetramers composed of 37 genes and 124 phenotypes connecting the three chemicals to male infertility. Visualization of this complex environmental health dataset illuminates candidate genes (BAX, BCL2, and SOD2) and phenotypes (male gonad development, apoptosis, and spermatogenesis) connecting the chemicals to male infertility, and thus may represent critical intermediate molecular mechanisms (<xref ref-type="fig" rid="F4">Figure 4</xref>).</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption>
<p>Multiple sets of CTD tetramer query results can be combined into a single chord diagram. Here, dibutyl phthalate (DBP), atrazine (Atz), and arsenic (As) are independently queried for their association with male infertility (MI), resulting in three separate datasets of 123, 122, and 136 CGPD-tetramers for each chemical-disease query, respectively. The three outputs can be manually combined by the user into a single CSV file of 381 total tetramers. The visualization tool transforms the merged datasets into a single chord diagram, and the scaled dimensions of nodes/arcs help identify potentially important genetic (BAX, BCL2, and SOD2, green arrows) and phenotypic (male gonad development, apoptosis, and spermatogenesis, purple arrows) molecular mechanisms.</p>
</caption>
<graphic xlink:href="ftox-06-1437884-g004.tif"/>
</fig>
</sec>
<sec id="s3-3">
<title>3.3 Limitations</title>
<p>An impediment for visualizing CGPD-tetramers as a chord diagram is spacing constraints that limit the comprehensibility of these diagrams. We have found that about 1,500 tetramers tend to represent a practical upper limit for figure clarity. For larger datasets, there are a few options. As described above, customizing the node displays either using the &#x201c;cex&#x201d; parameter (for font size) or changing the label from &#x201c;term&#x201d; to &#x201c;node ID&#x201d; will significantly reduce the text (panel J, <xref ref-type="sec" rid="s10">Supplemental File S2</xref>), resulting in a more compact diagram, but still enabling nodes to be readily identified. As well, the starting number of CGPD-tetramers to be graphed can be reduced preemptively by adding additional search parameters in the query to narrow the dataset to focus on a more specific question. For example, a query for &#x201c;liver neoplasms&#x201d; results in over 16,700 CGPD-tetramers, and represents a very broad open-ended question with respect to environmental health. However, when &#x201c;metals&#x201d; is included as the chemical parameter in the search, the number reduces to 309 (<xref ref-type="fig" rid="F3">Figure 3</xref>), and focuses on a more specific, addressable environmental health question. Alternatively, including phenotypes (e.g., &#x201c;nervous system process,&#x201d; &#x201c;inflammatory response&#x201d;, or &#x201c;metabolic process,&#x201d; with the filter option actively changed to include any descendant term) can also help focus questions and provide a more manageable number of CGPD-tetramers for analysis. Finally, CTD is also exploring ways to rank tetramers with a metric score as a means to prioritize the query results with the CGPD-tetramers that have the most supporting lines of evidence from the literature. Currently, the default display is alphabetical on the web-page results. Ranking would allow users to select tetramer subsets (instead of using the entire output) to include in their chord diagram.</p>
<p>Another limitation is the use of colors to represent information, as this may be an issue for those with color-vision deficiencies. Users can customize the plot colors to provide accessibility for specific color-vision deficiencies (<xref ref-type="bibr" rid="B3">Dahl et al., 2022</xref>) or for aesthetic purposes (panel K, <xref ref-type="sec" rid="s10">Supplemental File S2</xref>).</p>
<p>Finally, the obvious complicating factor to this approach is the manual effort required to download and transfer data files from CTD to an R environment in order to generate a chord diagram. Consequently, we plan to integrate similar functionality directly into CTD Tetramer query results pages in a future release.</p>
</sec>
</sec>
<sec sec-type="discussion" id="s4">
<title>4 Discussion</title>
<p>Advances are being made to provide clarity to complex environmental health data, including development and adoption of standardized vocabularies (<xref ref-type="bibr" rid="B15">Mattingly et al., 2016</xref>; <xref ref-type="bibr" rid="B12">Holmgren et al., 2023</xref>) and development of visual frameworks that display, organize, and integrate data from diverse sources. For example, the Aggregate Exposure Pathway (AEP) collates and structures chemical and biological knowledge at the population level to connect an environmental stressor with its source, medium, external/internal concentrations, and target site exposure (<xref ref-type="bibr" rid="B19">Teeguarden et al., 2016</xref>), while the Adverse Outcome Pathway (AOP) assembles information at the cellular level to link an initiating molecular event, a series of key processes, and an adverse outcome (<xref ref-type="bibr" rid="B1">Ankley and Edwards, 2018</xref>). Together, the AEP and AOP frameworks complement each other and connect population data to molecular data, respectively, helping to bridge the environmental health continuum (<xref ref-type="bibr" rid="B11">Hines, et al., 2018</xref>).</p>
<p>To harmonize environmental health data, CTD embraces community-accepted FAIR controlled vocabularies and ontologies to curate the scientific literature for both population exposure science (<xref ref-type="bibr" rid="B9">Grondin et al., 2016</xref>) and molecular/cellular laboratory results (<xref ref-type="bibr" rid="B7">Davis et al., 2011</xref>). This imperative step enables disparate data to be integrated to generate inferred relationships that provide potential mechanistic solutions for recognized knowledge gaps (<xref ref-type="bibr" rid="B4">Davis et al., 2008</xref>). CGPD-tetramers are a novel derivative of this integration strategy, where the combined data types are structured as a step-wise mechanistic pathway: a chemical first interacts with a gene to then modulate a phenotype that may contribute to a final disease outcome (<xref ref-type="bibr" rid="B5">Davis et al., 2020</xref>). Users can easily generate CGPD-tetramers for any environmental chemical, gene, phenotype, or disease of interest at CTD (<xref ref-type="bibr" rid="B8">Davis et al., 2023b</xref>); however, these queries typically bring back hundreds of results, in a web-based table.</p>
<p>To help survey and distill these large environmental health datasets, we present a simple visualization method that transforms CGPD-tetramers into a chord diagram, allowing all of the data to be condensed and viewed in a single, elegant figure. CGPD-tetramers are formatted and transformed using R. While our technique can be easily adopted by researchers already familiar with R, we provide step-by-step instructions for novice users, leveraging a free web-browser system that enables inexperienced users to generate publication-worthy chord diagrams for their own presentations. By their nature, chord diagrams show the interconnections between different data types and facilitate the visual identification of the most frequently used data components, allowing users to discern potentially important intermediate molecular mechanisms between an environmental exposure and a disease outcome. Graphing these complex, toxicology-related mechanistic pathways can help build, inform, or refine current AOPs (<xref ref-type="bibr" rid="B8">Davis et al., 2023b</xref>) and be used to provide visual mechanistic links to AEPs. Together, both the table-based version of CGPD-tetramers and the derived chord diagrams complement each other, with the former providing data in an easily sortable format and the latter providing a graphical view that helps to visually detect key data types.</p>
</sec>
</body>
<back>
<sec sec-type="data-availability" id="s5">
<title>Data availability statement</title>
<p>The datasets presented in this study can be found in online repositories. The names of the repository/repositories and accession number(s) can be found in the article/<xref ref-type="sec" rid="s10">Supplementary Material</xref>.</p>
</sec>
<sec id="s6">
<title>Author contributions</title>
<p>BW: Data curation, Investigation, Methodology, Validation, Writing&#x2013;original draft, Writing&#x2013;review and editing. AD: Conceptualization, Data curation, Investigation, Supervision, Validation, Visualization, Writing&#x2013;original draft, Writing&#x2013;review and editing. TW: Software, Writing&#x2013;review and editing. JW: Software, Writing&#x2013;review and editing. SA: Software, Writing&#x2013;review and editing. DS: Data curation, Writing&#x2013;review and editing. FB: Data curation, Writing&#x2013;review and editing. MS: Data curation, Writing&#x2013;review and editing. CM: Funding acquisition, Project administration, Writing&#x2013;review and editing.</p>
</sec>
<sec sec-type="funding-information" id="s7">
<title>Funding</title>
<p>The author(s) declare that financial support was received for the research, authorship, and/or publication of this article. National Institute of Environmental Health Sciences [U24 ES033155]. The content is solely the responsibility of the authors and does not necessarily represent the official views of the National Institutes of Health.</p>
</sec>
<ack>
<p>We thank Dr. Antonio Planchart for testing the methods and critically reviewing the manuscript.</p>
</ack>
<sec sec-type="COI-statement" id="s8">
<title>Conflict of interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<sec sec-type="disclaimer" id="s9">
<title>Publisher&#x2019;s note</title>
<p>All claims expressed in this article are solely those of the authors and do not necessarily represent those of their affiliated organizations, or those of the publisher, the editors and the reviewers. Any product that may be evaluated in this article, or claim that may be made by its manufacturer, is not guaranteed or endorsed by the publisher.</p>
</sec>
<sec id="s10">
<title>Supplementary material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/ftox.2024.1437884/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/ftox.2024.1437884/full&#x23;supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="DataSheet1.zip" id="SM1" mimetype="application/zip" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="DataSheet1.pdf" id="SM2" mimetype="application/pdf" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Ankley</surname>
<given-names>G. T.</given-names>
</name>
<name>
<surname>Edwards</surname>
<given-names>S. W.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>The adverse outcome pathway: a multifaceted framework supporting 21st century toxicology</article-title>. <source>Curr. Opin. Toxicol.</source> <volume>9</volume>, <fpage>1</fpage>&#x2013;<lpage>7</lpage>. <pub-id pub-id-type="doi">10.1016/j.cotox.2018.03.004</pub-id>
</citation>
</ref>
<ref id="B2">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chai</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Zhao</surname>
<given-names>C.</given-names>
</name>
<name>
<surname>Jin</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zou</surname>
<given-names>P.</given-names>
</name>
<name>
<surname>Ling</surname>
<given-names>X.</given-names>
</name>
<etal/>
</person-group> (<year>2021</year>). <article-title>Generating adverse outcome pathway (AOP) of inorganic arsenic-induced adult male reproductive impairment via integration of phenotypic analysis in Comparative Toxicogenomics Database (CTD) and AOP wiki</article-title>. <source>Toxicol. Appl. Pharmacol.</source> <volume>411</volume>, <fpage>115370</fpage>. <pub-id pub-id-type="doi">10.1016/j.taap.2020.115370</pub-id>
</citation>
</ref>
<ref id="B3">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Dahl</surname>
<given-names>E. M.</given-names>
</name>
<name>
<surname>Neer</surname>
<given-names>E.</given-names>
</name>
<name>
<surname>Bowie</surname>
<given-names>K. R.</given-names>
</name>
<name>
<surname>Leung</surname>
<given-names>E. T.</given-names>
</name>
<name>
<surname>Karstens</surname>
<given-names>L.</given-names>
</name>
</person-group> (<year>2022</year>). <article-title>microshades: an R package for improving color accessibility and organization of microbiome data</article-title>. <source>Microbiol. Resour. Announc.</source> <volume>11</volume>, <fpage>e0079522</fpage>. <pub-id pub-id-type="doi">10.1128/mra.00795-22</pub-id>
</citation>
</ref>
<ref id="B4">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Davis</surname>
<given-names>A. P.</given-names>
</name>
<name>
<surname>Murphy</surname>
<given-names>C. G.</given-names>
</name>
<name>
<surname>Rosenstein</surname>
<given-names>M. C.</given-names>
</name>
<name>
<surname>Wiegers</surname>
<given-names>T. C.</given-names>
</name>
<name>
<surname>Mattingly</surname>
<given-names>C. J.</given-names>
</name>
</person-group> (<year>2008</year>). <article-title>The Comparative Toxicogenomics Database facilitates identification and understanding of chemical-gene-disease associations: arsenic as a case study</article-title>. <source>BMC Med. Genomics.</source> <volume>1</volume>, <fpage>48</fpage>. <pub-id pub-id-type="doi">10.1093/database/bar034</pub-id>
</citation>
</ref>
<ref id="B5">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Davis</surname>
<given-names>A. P.</given-names>
</name>
<name>
<surname>Wiegers</surname>
<given-names>T. C.</given-names>
</name>
<name>
<surname>Grondin</surname>
<given-names>C. J.</given-names>
</name>
<name>
<surname>Johnson</surname>
<given-names>R. J.</given-names>
</name>
<name>
<surname>Sciaky</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Wiegers</surname>
<given-names>J.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Leveraging the Comparative Toxicogenomics Database to fill in knowledge gaps for environmental health: a test case for air pollution-induced cardiovascular disease</article-title>. <source>Toxicol. Sci.</source> <volume>177</volume>, <fpage>392</fpage>&#x2013;<lpage>404</lpage>. <pub-id pub-id-type="doi">10.1093/toxsci/kfaa113</pub-id>
</citation>
</ref>
<ref id="B6">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Davis</surname>
<given-names>A. P.</given-names>
</name>
<name>
<surname>Wiegers</surname>
<given-names>T. C.</given-names>
</name>
<name>
<surname>Johnson</surname>
<given-names>R. J.</given-names>
</name>
<name>
<surname>Sciaky</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Wiegers</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Mattingly</surname>
<given-names>C. J.</given-names>
</name>
</person-group> (<year>2023a</year>). <article-title>Comparative toxicogenomics database (CTD): update 2023</article-title>. <source>Nucleic Acids Res.</source> <volume>51</volume>, <fpage>D1257</fpage>&#x2013;<lpage>D1262</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkac833</pub-id>
</citation>
</ref>
<ref id="B7">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Davis</surname>
<given-names>A. P.</given-names>
</name>
<name>
<surname>Wiegers</surname>
<given-names>T. C.</given-names>
</name>
<name>
<surname>Rosenstein</surname>
<given-names>M. C.</given-names>
</name>
<name>
<surname>Murphy</surname>
<given-names>C. G.</given-names>
</name>
<name>
<surname>Mattingly</surname>
<given-names>C. J.</given-names>
</name>
</person-group> (<year>2011</year>). <article-title>The curation paradigm and application tool used for manual curation of the scientific literature at the Comparative Toxicogenomics Database</article-title>. <source>Database (Oxford)</source> <volume>2011</volume>, <fpage>bar034</fpage>. <pub-id pub-id-type="doi">10.1093/database/bar034</pub-id>
</citation>
</ref>
<ref id="B8">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Davis</surname>
<given-names>A. P.</given-names>
</name>
<name>
<surname>Wiegers</surname>
<given-names>T. C.</given-names>
</name>
<name>
<surname>Wiegers</surname>
<given-names>J. W.</given-names>
</name>
<name>
<surname>Wyatt</surname>
<given-names>B.</given-names>
</name>
<name>
<surname>Johnson</surname>
<given-names>R. J.</given-names>
</name>
<name>
<surname>Sciaky</surname>
<given-names>D.</given-names>
</name>
<etal/>
</person-group> (<year>2023b</year>). <article-title>CTD tetramers: a new online tool that computationally links curated chemicals, genes, phenotypes, and diseases to inform molecular mechanisms for environmental health</article-title>. <source>Toxicol. Sci.</source> <volume>195</volume>, <fpage>155</fpage>&#x2013;<lpage>168</lpage>. <pub-id pub-id-type="doi">10.1093/toxsci/kfad069</pub-id>
</citation>
</ref>
<ref id="B9">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Grondin</surname>
<given-names>C. J.</given-names>
</name>
<name>
<surname>Davis</surname>
<given-names>A. P.</given-names>
</name>
<name>
<surname>Wiegers</surname>
<given-names>T. C.</given-names>
</name>
<name>
<surname>King</surname>
<given-names>B. L.</given-names>
</name>
<name>
<surname>Wiegers</surname>
<given-names>J. A.</given-names>
</name>
<name>
<surname>Reif</surname>
<given-names>D. M.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Advancing exposure science through chemical data curation and integration in the Comparative Toxicogenomics Database</article-title>. <source>Environ. Health Perspect.</source> <volume>124</volume>, <fpage>1592</fpage>&#x2013;<lpage>1599</lpage>. <pub-id pub-id-type="doi">10.1289/ehp174</pub-id>
</citation>
</ref>
<ref id="B10">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Gu</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Gu</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Eils</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Schlesner</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Brors</surname>
<given-names>B.</given-names>
</name>
</person-group> (<year>2014</year>). <article-title>Circlize Implements and enhances circular visualization in R</article-title>. <source>Bioinformatics</source> <volume>30</volume>, <fpage>2811</fpage>&#x2013;<lpage>2812</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btu393</pub-id>
</citation>
</ref>
<ref id="B11">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hines</surname>
<given-names>D. E.</given-names>
</name>
<name>
<surname>Edwards</surname>
<given-names>S. W.</given-names>
</name>
<name>
<surname>Conolly</surname>
<given-names>R. B.</given-names>
</name>
<name>
<surname>Jarabek</surname>
<given-names>A. M.</given-names>
</name>
</person-group> (<year>2018</year>). <article-title>A case study application of the Aggregate Exposure Pathway (AEP) and Adverse Outcome Pathway (AOP) frameworks to facilitate the integration of human health and ecological end points for cumulative risk assessment (CRA)</article-title>. <source>Environ. Sci. Technol.</source> <volume>52</volume>, <fpage>839</fpage>&#x2013;<lpage>849</lpage>. <pub-id pub-id-type="doi">10.1021/acs.est.7b04940</pub-id>
</citation>
</ref>
<ref id="B12">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Holmgren</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Bell</surname>
<given-names>S. M.</given-names>
</name>
<name>
<surname>Wignall</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Duncan</surname>
<given-names>C. G.</given-names>
</name>
<name>
<surname>Kwok</surname>
<given-names>R. K.</given-names>
</name>
<name>
<surname>Cronk</surname>
<given-names>R.</given-names>
</name>
<etal/>
</person-group> (<year>2023</year>). <article-title>Workshop report: catalyzing knowledge-driven discovery in environmental health sciences through a harmonized language</article-title>. <source>Int. J. Environ. Res. Public Heath.</source> <volume>20</volume>, <fpage>2317</fpage>. <pub-id pub-id-type="doi">10.3390/ijerph20032317</pub-id>
</citation>
</ref>
<ref id="B13">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jeong</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Kin</surname>
<given-names>D.</given-names>
</name>
<name>
<surname>Choi</surname>
<given-names>J.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Integrative data mining approach: case study with adverse outcome pathway network leading to pulmonary fibrosis</article-title>. <source>Chem. Res. Toxicol.</source> <volume>36</volume>, <fpage>838</fpage>&#x2013;<lpage>847</lpage>. <pub-id pub-id-type="doi">10.1021/acs.chemrestox.2c00325</pub-id>
</citation>
</ref>
<ref id="B14">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Kim</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>S. H.</given-names>
</name>
<name>
<surname>Choi</surname>
<given-names>J. Y.</given-names>
</name>
<name>
<surname>Park</surname>
<given-names>Y. J.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Investigating fatty liver disease-associated adverse outcome pathways of perfluorooctane sulfonate using a systems toxicology approach</article-title>. <source>Food Chem. Toxicol.</source> <volume>176</volume>, <fpage>113781</fpage>. <pub-id pub-id-type="doi">10.1016/j.fct.2023.113781</pub-id>
</citation>
</ref>
<ref id="B15">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Mattingly</surname>
<given-names>C. J.</given-names>
</name>
<name>
<surname>Boyles</surname>
<given-names>R.</given-names>
</name>
<name>
<surname>Lawler</surname>
<given-names>C. P.</given-names>
</name>
<name>
<surname>Haugen</surname>
<given-names>A. C.</given-names>
</name>
<name>
<surname>Dearry</surname>
<given-names>A.</given-names>
</name>
<name>
<surname>Haendel</surname>
<given-names>M.</given-names>
</name>
</person-group> (<year>2016</year>). <article-title>Laying a community-based foundation for data-driven semantic standards in environmental health sciences</article-title>. <source>Environ. Health Perspect.</source> <volume>124</volume>, <fpage>1136</fpage>&#x2013;<lpage>1140</lpage>. <pub-id pub-id-type="doi">10.1289/ehp.1510438</pub-id>
</citation>
</ref>
<ref id="B16">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Nguyen</surname>
<given-names>H. D.</given-names>
</name>
<name>
<surname>Kim</surname>
<given-names>M.-S.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Interactions between cadmium, lead, mercury, and arsenic and depression: a molecular mechanism involved</article-title>. <source>J. Affect. Disord.</source> <volume>327</volume>, <fpage>315</fpage>&#x2013;<lpage>329</lpage>. <pub-id pub-id-type="doi">10.1016/j.jad.2023.02.013</pub-id>
</citation>
</ref>
<ref id="B17">
<citation citation-type="book">
<collab>R Core Team</collab> (<year>2018</year>). <source>R: a language and environment for statistical computing</source>. <publisher-loc>Vienna, Austria</publisher-loc>: <publisher-name>R Foundation for Statistical Computing</publisher-name>. <comment>Available at: <ext-link ext-link-type="uri" xlink:href="https://www.r-project.org/">https://www.r-project.org/</ext-link>.</comment>
</citation>
</ref>
<ref id="B18">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Rodprasert</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Toppari</surname>
<given-names>J.</given-names>
</name>
<name>
<surname>Virtanen</surname>
<given-names>H.</given-names>
</name>
</person-group> (<year>2023</year>). <article-title>Environmental toxicants and male fertility</article-title>. <source>Best. Pract. Res. Clin. Obstet. Gynaecol.</source> <volume>86</volume>, <fpage>102298</fpage>. <pub-id pub-id-type="doi">10.1016/j.bpobgyn.2022.102298</pub-id>
</citation>
</ref>
<ref id="B19">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Teeguarden</surname>
<given-names>J. G.</given-names>
</name>
<name>
<surname>Tan</surname>
<given-names>Y.-M.</given-names>
</name>
<name>
<surname>Edwards</surname>
<given-names>S. W.</given-names>
</name>
<name>
<surname>Leonard</surname>
<given-names>J. A.</given-names>
</name>
<name>
<surname>Anderson</surname>
<given-names>K. A.</given-names>
</name>
<name>
<surname>Gorley</surname>
<given-names>R. A.</given-names>
</name>
<etal/>
</person-group> (<year>2016</year>). <article-title>Completing the link between exposure science and toxicology for improved environmental health decision making: the Aggregate Exposure Pathway framework</article-title>. <source>Environ. Sci. Technol.</source> <volume>50</volume>, <fpage>4579</fpage>&#x2013;<lpage>4586</lpage>. <pub-id pub-id-type="doi">10.1021/acs.est.5b05311</pub-id>
</citation>
</ref>
<ref id="B20">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Thessen</surname>
<given-names>A. E.</given-names>
</name>
<name>
<surname>Grondin</surname>
<given-names>C. J.</given-names>
</name>
<name>
<surname>Kulkarni</surname>
<given-names>R. D.</given-names>
</name>
<name>
<surname>Brander</surname>
<given-names>S.</given-names>
</name>
<name>
<surname>Truong</surname>
<given-names>L.</given-names>
</name>
<name>
<surname>Vasilevsky</surname>
<given-names>N. A.</given-names>
</name>
<etal/>
</person-group> (<year>2020</year>). <article-title>Community approaches for integrating environmental exposures into human models of disease</article-title>. <source>Environ. Health Perspect.</source> <volume>128</volume>, <fpage>125002</fpage>. <pub-id pub-id-type="doi">10.1289/ehp7215</pub-id>
</citation>
</ref>
<ref id="B21">
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhao</surname>
<given-names>Y.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>X.</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>Z.</given-names>
</name>
<name>
<surname>Huang</surname>
<given-names>W.</given-names>
</name>
<name>
<surname>Tang</surname>
<given-names>M.</given-names>
</name>
<name>
<surname>Du</surname>
<given-names>G.</given-names>
</name>
<etal/>
</person-group> (<year>2024</year>). <article-title>Hepatic toxicity prediction of bisphenol analogs by machine learning strategy</article-title>. <source>Sci. Total Environ.</source> <volume>934</volume>, <fpage>173420</fpage>. <pub-id pub-id-type="doi">10.1016/j.scitotenv.2024.173420</pub-id>
</citation>
</ref>
</ref-list>
</back>
</article>