<?xml version="1.0" encoding="UTF-8" standalone="no"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Front. Plant Sci.</journal-id>
<journal-title>Frontiers in Plant Science</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Front. Plant Sci.</abbrev-journal-title>
<issn pub-type="epub">1664-462X</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="doi">10.3389/fpls.2020.590949</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Plant Science</subject>
<subj-group>
<subject>Original Research</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>PhaeoNet: A Holistic RNAseq-Based Portrait of Transcriptional Coordination in the Model Diatom <italic>Phaeodactylum tricornutum</italic></article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Ait-Mohamed</surname> <given-names>Ouardia</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn002"><sup>&#x2020;</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Nov&#x00E1;k Vanclov&#x00E1;</surname> <given-names>Anna M. G.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn003"><sup>&#x2021;</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Joli</surname> <given-names>Nathalie</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="author-notes" rid="fn003"><sup>&#x2021;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/733847/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Liang</surname> <given-names>Yue</given-names></name>
<xref ref-type="aff" rid="aff2"><sup>2</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Zhao</surname> <given-names>Xue</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Genovesio</surname> <given-names>Auguste</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Tirichine</surname> <given-names>Leila</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="aff" rid="aff3"><sup>3</sup></xref>
<xref ref-type="corresp" rid="c001"><sup>&#x002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/664173/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name><surname>Bowler</surname> <given-names>Chris</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<xref ref-type="corresp" rid="c002"><sup>&#x002A;</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/26015/overview"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Dorrell</surname> <given-names>Richard G.</given-names></name>
<xref ref-type="aff" rid="aff1"><sup>1</sup></xref>
<uri xlink:href="http://loop.frontiersin.org/people/761550/overview"/>
</contrib>
</contrib-group>
<aff id="aff1"><sup>1</sup><institution>Institut de Biologie de l&#x2019;Ecole Normale Sup&#x00E9;rieure (IBENS), Ecole Normale Sup&#x00E9;rieure, CNRS, INSERM, Universit&#x00E9; PSL</institution>, <addr-line>Paris</addr-line>, <country>France</country></aff>
<aff id="aff2"><sup>2</sup><institution>Department of Oceanography, Dalhousie University</institution>, <addr-line>Halifax, NS</addr-line>, <country>Canada</country></aff>
<aff id="aff3"><sup>3</sup><institution>Universit&#x00E9; de Nantes, CNRS, UFIP, UMR 6286</institution>, <addr-line>Nantes</addr-line>, <country>France</country></aff>
<author-notes>
<fn fn-type="edited-by"><p>Edited by: Justine Marchand, Le Mans Universit&#x00E9;, France</p></fn>
<fn fn-type="edited-by"><p>Reviewed by: Pannaga Pavan Jutur, International Centre for Genetic Engineering and Biotechnology, India; Yoshihisa Hirakawa, University of Tsukuba, Japan</p></fn>
<corresp id="c001">&#x002A;Correspondence: Leila Tirichine, <email>Leila.Tirichine@univ-nantes.fr</email></corresp>
<corresp id="c002">Chris Bowler, <email>cbowler@biologie.ens.fr</email></corresp>
<fn fn-type="other" id="fn002"><p><sup>&#x2020;</sup>Present address: Ouardia Ait-Mohamed, Immunity and Cancer Department, Institut Curie, PSL Research University, INSERM U932, Paris, France</p></fn>
<fn fn-type="other" id="fn003"><p><sup>&#x2021;</sup>These authors have contributed equally to this work</p></fn>
<fn fn-type="other" id="fn004"><p>This article was submitted to Marine and Freshwater Plants, a section of the journal Frontiers in Plant Science</p></fn>
</author-notes>
<pub-date pub-type="epub">
<day>16</day>
<month>10</month>
<year>2020</year>
</pub-date>
<pub-date pub-type="collection">
<year>2020</year>
</pub-date>
<volume>11</volume>
<elocation-id>590949</elocation-id>
<history>
<date date-type="received">
<day>03</day>
<month>08</month>
<year>2020</year>
</date>
<date date-type="accepted">
<day>15</day>
<month>09</month>
<year>2020</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#x00A9; 2020 Ait-Mohamed, Nov&#x00E1;k Vanclov&#x00E1;, Joli, Liang, Zhao, Genovesio, Tirichine, Bowler and Dorrell.</copyright-statement>
<copyright-year>2020</copyright-year>
<copyright-holder>Ait-Mohamed, Nov&#x00E1;k Vanclov&#x00E1;, Joli, Liang, Zhao, Genovesio, Tirichine, Bowler and Dorrell</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these terms.</p></license>
</permissions>
<abstract>
<p>Transcriptional coordination is a fundamental component of prokaryotic and eukaryotic cell biology, underpinning the cell cycle, physiological transitions, and facilitating holistic responses to environmental stress, but its overall dynamics in eukaryotic algae remain poorly understood. Better understanding of transcriptional partitioning may provide key insights into the primary metabolism pathways of eukaryotic algae, which frequently depend on intricate metabolic associations between the chloroplasts and mitochondria that are not found in plants. Here, we exploit 187 publically available RNAseq datasets generated under varying nitrogen, iron and phosphate growth conditions to understand the co-regulatory principles underpinning transcription in the model diatom <italic>Phaeodactylum tricornutum</italic>. Using WGCNA (Weighted Gene Correlation Network Analysis), we identify 28 merged modules of co-expressed genes in the <italic>P. tricornutum</italic> genome, which show high connectivity and correlate well with previous microarray-based surveys of gene co-regulation in this species. We use combined functional, subcellular localization and evolutionary annotations to reveal the fundamental principles underpinning the transcriptional co-regulation of genes implicated in <italic>P. tricornutum</italic> chloroplast and mitochondrial metabolism, as well as the functions of diverse transcription factors underpinning this co-regulation. The resource is publically available as PhaeoNet, an advanced tool to understand diatom gene co-regulation.</p>
</abstract>
<kwd-group>
<kwd>stramenopile</kwd>
<kwd>transcriptomics</kwd>
<kwd>sigma factors</kwd>
<kwd>aureochromes</kwd>
<kwd>epigenetics</kwd>
<kwd>chloroplast-mitochondria</kwd>
</kwd-group>
<contract-sponsor id="cn001">Centre National de la Recherche Scientifique<named-content content-type="fundref-id">10.13039/501100004794</named-content></contract-sponsor><contract-sponsor id="cn002">Chinese Government Scholarship<named-content content-type="fundref-id">10.13039/501100010890</named-content></contract-sponsor>
<counts>
<fig-count count="5"/>
<table-count count="0"/>
<equation-count count="0"/>
<ref-count count="122"/>
<page-count count="17"/>
<word-count count="0"/>
</counts>
</article-meta>
</front>
<body>
<sec id="S1">
<title>Introduction</title>
<p>The biology of prokaryotic and eukaryotic cells is dependent on elaborate metabolic, regulatory and gene expression pathways, consisting of multiple interacting components. The successful operation of these pathways depend on the coordinated expression of genes that underpin them, which allow the stoichiometric assembly of their constituent components and enable discrete and appropriate regulatory responses to changes in physiological conditions (<xref ref-type="bibr" rid="B42">Gasch and Eisen, 2002</xref>; <xref ref-type="bibr" rid="B109">Teichmann and Babu, 2002</xref>). In prokaryotes and bacteria-derived genomes (e.g., &#x201C;plastids&#x201D; including chloroplasts and mitochondria) gene co-regulation is possible via the co-transcription of linked genes as part of the same transcriptional operon (<xref ref-type="bibr" rid="B109">Teichmann and Babu, 2002</xref>). In contrast, gene order plays a limited role in eukaryotic nuclear gene co-expression (<xref ref-type="bibr" rid="B77">Michalak, 2008</xref>), which depends instead on the simultaneous transcription, or transcriptional stabilization, of multiple discrete genomic loci. This may occur through common transcription factors (<xref ref-type="bibr" rid="B109">Teichmann and Babu, 2002</xref>; <xref ref-type="bibr" rid="B94">Reja et al., 2015</xref>); epigenetic modifications based around characteristic histone and DNA marks (<xref ref-type="bibr" rid="B16">Bird, 2002</xref>; <xref ref-type="bibr" rid="B11">B&#x00E1;rtov&#x00E1; et al., 2008</xref>); co-ordinated transcript processing events (<xref ref-type="bibr" rid="B84">Norbury, 2010</xref>); and the activity of small and long regulatory non-coding RNAs (<xref ref-type="bibr" rid="B110">Tsai et al., 2010</xref>; <xref ref-type="bibr" rid="B62">Kim and Sung, 2012</xref>).</p>
<p>The degree to which gene co-regulation is shared between different species is debated, with different studies identifying shared co-regulatory trends in between 8% (<xref ref-type="bibr" rid="B109">Teichmann and Babu, 2002</xref>) and 70% (<xref ref-type="bibr" rid="B104">Snel et al., 2004</xref>) of orthologous gene pairs between <italic>Saccharomyces cerevisiae</italic> (yeast) and <italic>Caenorhabditis elegans</italic> (nematode) genomes. Nonetheless, there is substantial merit to understanding gene co-regulation patterns in novel species. Since their origins over two billion years ago, the eukaryotes have radiated into a diverse range of different lineages, many of which are unicellular; and distantly related to model organisms in the animals, fungi and plants, with different underlying cellular biology and transcriptional dynamics (<xref ref-type="bibr" rid="B115">Walker et al., 2011</xref>). Identifying what gene co-regulation processes occur in microbial eukaryotes may allow us to better understand the biology underpinning the base of planetary food webs; and to better model the robustness of eukaryotic communities to environmental change.</p>
<p>The diatoms are a major group of predominantly marine algae, believed to be responsible for nearly one-fifth of total planetary photosynthesis (<xref ref-type="bibr" rid="B39">Field et al., 1998</xref>). Diatoms sit within the stramenopile supergroup, and are distantly related to animals, fungi and plants. Photosynthetic members of the stramenopiles, including diatoms, possess a chloroplast acquired through secondary endosymbiosis, unlike the primary plant chloroplast, which is of primary endosymbiotic origin (<xref ref-type="bibr" rid="B115">Walker et al., 2011</xref>). Previous genomic and functional investigations of model diatoms, for example <italic>Phaeodactylum tricornutum</italic>, have identified divergent features in their cellular biology, compared to more well-understood eukaryotic groups (<xref ref-type="bibr" rid="B19">Bowler et al., 2010</xref>). These include intricate metabolic connections between the diatom chloroplast, mitochondria and cytoplasm (<xref ref-type="bibr" rid="B91">Prihoda et al., 2012</xref>; <xref ref-type="bibr" rid="B8">Bailleul et al., 2015</xref>); and a wide range of different histone structural modifications (<xref ref-type="bibr" rid="B113">Veluchamy et al., 2013</xref>, <xref ref-type="bibr" rid="B114">2015</xref>), many of which have not yet been detected in more established eukaryotic models.</p>
<p>Previously, microarray data from over 100 different conditions, including illumination regimes and pollutant stress (<xref ref-type="bibr" rid="B86">Osborn and Hook, 2013</xref>; <xref ref-type="bibr" rid="B112">Valle et al., 2014</xref>), have been generated from <italic>P. tricornutum</italic>; which have been assembled into a searchable interface, DiatomPortal that divides the <italic>P. tricornutum</italic> genome into 500 co-regulated gene clusters (<xref ref-type="bibr" rid="B7">Ashworth et al., 2016</xref>). Alongside this, a suite of RNA sequencing libraries exploring cellular responses to phosphorus, iron and nitrogen limitation have now been generated (<xref ref-type="bibr" rid="B72">Maheswari et al., 2010</xref>; <xref ref-type="bibr" rid="B30">Cruz de Carvalho et al., 2016</xref>; <xref ref-type="bibr" rid="B103">Smith et al., 2016</xref>; <xref ref-type="bibr" rid="B76">McCarthy et al., 2017</xref>) and inspecting these data may allow more precise integration of quantitative differences in transcript abundance than would be possible through microarray analyses. Furthermore, co-expression networks are a powerful tool for functional prediction and annotation of unknown genes in the absence of prior knowledge, which is the case for a significant number of genes in <italic>P. tricornutum</italic> (<xref ref-type="bibr" rid="B92">Rastogi et al., 2018</xref>). Co-expression networks can furthermore enrich our understanding of the more sparse co-expression networks generated for other marine algal species with secondary chloroplasts (principally, the distantly related diatom <italic>Thalassiosira pseudonana</italic>, the distantly related stramenopile <italic>Nannochloropsis oceanica</italic> and the haptophyte <italic>Emiliania huxleyi</italic>; <xref ref-type="bibr" rid="B7">Ashworth et al., 2016</xref>; <xref ref-type="bibr" rid="B6">Ashworth and Ralph, 2018</xref>).</p>
<p>Here, we use a tool of gene co-expression network analysis, WGCNA (Weighted Gene Correlation Network Analysis (<xref ref-type="bibr" rid="B67">Langfelder and Horvath, 2008</xref>; <xref ref-type="bibr" rid="B48">Guidi et al., 2016</xref>), to build PhaeoNet, an advanced tool for transcriptional understanding of the <italic>P. tricornutum</italic> genome. PhaeoNet is composed of 28 co-regulated gene modules, each with different expression dynamics. Considering the repartition of genes within these modules; functional, epigenetic and localization information from the third version annotation of the <italic>P. tricornutum</italic> genome (Phatr3; <xref ref-type="bibr" rid="B92">Rastogi et al., 2018</xref>); and annotated lists of diatom transcription factors (<xref ref-type="bibr" rid="B93">Rayko et al., 2010</xref>), we identify core features underpinning the transcriptional partitioning of diatom primary metabolism, including probable metabolic links between the diatom mitochondria and chloroplast; and dissect the diverse ranges of different transcriptional drivers of this co-regulation, notably in the case of chloroplast-targeted sigma factors. The raw data underpinning PhaeoNet have been made publically accessible via <ext-link ext-link-type="uri" xlink:href="https://osf.io/42xmp">https://osf.io/42xmp</ext-link>.</p>
</sec>
<sec id="S2" sec-type="materials|methods">
<title>Materials and Methods</title>
<sec id="S2.SS1">
<title>Dataset Curation and Abundance Calculations</title>
<p>A total of 187 publically available RNA-seq datasets from <italic>P. tricornutum</italic>, generated from three studies exploring, respectively, phosphorus (<xref ref-type="bibr" rid="B30">Cruz de Carvalho et al., 2016</xref>), iron (<xref ref-type="bibr" rid="B103">Smith et al., 2016</xref>) and nitrogen (<xref ref-type="bibr" rid="B76">McCarthy et al., 2017</xref>) stress transcriptional responses, were collected from the sequence read archive (SRA)<sup><xref ref-type="fn" rid="footnote1">1</xref></sup> (<xref ref-type="bibr" rid="B118">Wheeler et al., 2006</xref>). The 182 libraries that passed through quality control steps, were included in the final version of the WGCNA performed, are named per their names respective studies in <xref ref-type="supplementary-material" rid="TS1">Supplementary Table 1</xref>, sheet 1. Data provided in the phosphate and nitrogen conditions were obtained using an Illumina Genome Analyzer (<xref ref-type="bibr" rid="B14">Bentley et al., 2008</xref>), while the iron study used SOLiD technology sequencing (<xref ref-type="bibr" rid="B79">Morey et al., 2013</xref>). <italic>P. tricornutum</italic> transcript IDs from each study were mapped to gene models based on the Phatr3 annotation of the genome (<xref ref-type="supplementary-material" rid="TS1">Supplementary Table 1</xref>, Sheet 2; <xref ref-type="bibr" rid="B92">Rastogi et al., 2018</xref>).</p>
<p>Raw data were reprocessed using FastQC version v0.11.5<sup><xref ref-type="fn" rid="footnote2">2</xref></sup>. Low quality reads (Phred quality score below 20) were filtered-out using trim-galore version 0.5.0<sup><xref ref-type="fn" rid="footnote3">3</xref></sup>. The remaining sequences were aligned to the reference genome with the software package STAR version 2.5.3a (<xref ref-type="bibr" rid="B34">Dobin et al., 2013</xref>) (STAR &#x2013;outFilterMismatchNmax 2 &#x2013;outFilterMultimapNmax 1000 &#x2013;alignIntronMin 20 &#x2013;alignIntronMax 2000). The iron data derived from the SOLiD technology were first mapped using the Life Technologies LifeScope software suitable for data from such technology. For homogeneity purposes, the reads were remapped using the pre-cited version of STAR.</p>
<p>Expression levels of individual genes were obtained using featureCounts version 1.6.1 (<xref ref-type="bibr" rid="B70">Liao et al., 2014</xref>). Quality checks of datasets were performed using methods provided in DESeq2 version 1.19.37 (<xref ref-type="bibr" rid="B71">Love et al., 2014</xref>), with a PCA projection and a hierarchical dendrogram using Spearman correlation between library-normalized gene counts (<xref ref-type="bibr" rid="B44">Glasser and Winter, 1961</xref>). These subsequent analyses and results visualizations were performed using R package version 3.4.4.</p>
</sec>
<sec id="S2.SS2">
<title>Weighted Gene Correlation Network Analysis (WGCNA) and Network Visualization</title>
<p>The WGCNA R package (<xref ref-type="bibr" rid="B67">Langfelder and Horvath, 2008</xref>) was used to identify network modules from library-normalized gene expression values. First, a signed adjacency matrix (accepting oppositely correlated gene expression values to be clustered in the same modules) was obtained by calculating the pairwise Bi-weight mid-correlation coefficient from rij (<xref ref-type="bibr" rid="B67">Langfelder and Horvath, 2008</xref>), that represent expression values of genes i and j. A connectivity measure (k) per gene set was calculated by summing the connection strengths with other gene sets. Subsequently, the weighted adjacency matrix was obtained by raising the absolute value of the pairwise gene expression correlations to the soft-thresholding parameter &#x03B2; (<xref ref-type="bibr" rid="B120">Zhao et al., 2010</xref>). This achieved the scale-free topology criterion for WGCNA and typical for biological networks, emphasizing high correlations and minoring low ones, in which most nodes are not connected and only a few nodes are highly connected (<xref ref-type="bibr" rid="B10">Barab&#x00E1;si, 2009</xref>).</p>
<p>The scale-free topology of PhaeoNet was evaluated by the Scale-Free Topology Fitting Index (<italic>R</italic><sup>2</sup>), which was the square of the correlation between log[p(k)] and log(k). A &#x03B2; coefficient of 12 with <italic>R</italic><sup>2</sup> of 0.9 was used during the network building from the signed weighted adjacency matrix. The weighted adjacency matrix was finally used to calculate the Topological Overlap Matrix (TOM). Subsequently, modules were detected on the basis of the Topological Overlap measure using the following parameters: minModuleSize = 40 and mergeCutHeight = 0.25.</p>
<p>Graphical representations of the network were performed using Cytoscape (<xref ref-type="bibr" rid="B100">Shannon et al., 2003</xref>). All code used for the construction of PhaeoNet and interactive diagrams of each merged module are publically available through the following link: <ext-link ext-link-type="uri" xlink:href="https://osf.io/42xmp">https://osf.io/42xmp</ext-link>.</p>
</sec>
<sec id="S2.SS3">
<title>Biological Interpretation of Merged Modules</title>
<p>The distribution of <italic>P. tricornutum</italic> genes in each transcriptional module was compared to the distribution of orthologous gene models (Phatr2.0 genome annotation) in microarray-derived transcriptional clusters generated as part of the DiatomPortal project (<xref ref-type="bibr" rid="B7">Ashworth et al., 2016</xref>). Only gene models that showed a one-to-one gene mapping (i.e., gene models that were neither split or merged, but including gene models that were truncated or extended) between version 2 (Phatr2) and version 3 (Phatr3) annotations of the <italic>P. tricornutum</italic> genome (<xref ref-type="bibr" rid="B18">Bowler et al., 2008</xref>; <xref ref-type="bibr" rid="B92">Rastogi et al., 2018</xref>) were considered.</p>
<p>Biological functions within the merged modules were identified using gene functional annotations from the Phatr3 annotation of the <italic>P. tricornutum</italic> genome (<xref ref-type="bibr" rid="B18">Bowler et al., 2008</xref>; <xref ref-type="bibr" rid="B92">Rastogi et al., 2018</xref>). These included: GO terms, using the R package TopGO (<xref ref-type="bibr" rid="B1">Aibar et al., 2015</xref>); PFAM domains and biological processes (<xref ref-type="bibr" rid="B92">Rastogi et al., 2018</xref>); probable evolutionary affinities inferred by BLAST top hit analyses (<xref ref-type="bibr" rid="B92">Rastogi et al., 2018</xref>); histone and DNA modifications associated with cells grown in replete media (<xref ref-type="bibr" rid="B113">Veluchamy et al., 2013</xref>, <xref ref-type="bibr" rid="B114">2015</xref>); Polycomb group protein marks (<xref ref-type="bibr" rid="B121">Zhao et al., 2020</xref>); and KEGG orthology predictions, obtained with BLASTkoala, Kofamkoala and GHOSTkoala servers (<xref ref-type="bibr" rid="B80">Moriya et al., 2007</xref>; <xref ref-type="bibr" rid="B55">Kanehisa, 2017</xref>; <xref ref-type="bibr" rid="B5">Aramaki et al., 2019</xref>; <xref ref-type="bibr" rid="B56">Kanehisa and Sato, 2020</xref>). <italic>In silico</italic> targeting predictions were performed for all N-complete protein sequences (i.e., protein sequences inferred to start in a methionine) within the dataset, using HECTAR (<xref ref-type="bibr" rid="B47">Gschloessl et al., 2008</xref>); ASAFind v2.0 (<xref ref-type="bibr" rid="B46">Gruber et al., 2015</xref>), in conjunction with SignalP v3.0 (<xref ref-type="bibr" rid="B13">Bendtsen et al., 2004</xref>); MitoFates, with a threshold detection value of 0.35 (<xref ref-type="bibr" rid="B41">Fukasawa et al., 2015</xref>; <xref ref-type="bibr" rid="B37">Dorrell et al., 2017</xref>); and WolfPSort, taking the consensus best-scoring prediction using animal, fungi and plant reference datasets (<xref ref-type="bibr" rid="B51">Horton et al., 2007</xref>). Enrichments in each category were analyzed both qualitatively/manually and by a simple pivot table and chi-squared test. Tabulated lists of all annotations are presented in <xref ref-type="supplementary-material" rid="TS2">Supplementary Table 2</xref>.</p>
<p>Core chloroplast and mitochondria-associated functions were assembled from a list of 524 KEGG ortholog numbers based on previously identified chloroplast and mitochondria functions in photosynthetic eukaryotes (<xref ref-type="bibr" rid="B37">Dorrell et al., 2017</xref>; <xref ref-type="bibr" rid="B82">Nonoyama et al., 2019</xref>; <xref ref-type="bibr" rid="B85">Nov&#x00E1;k Vanclov&#x00E1; et al., 2020</xref>). Where multiple candidate proteins were detected, proteins were assigned to either the chloroplast, mitochondria, or dual chloroplast/mitochondria (<xref ref-type="bibr" rid="B43">Gile et al., 2015</xref>; <xref ref-type="bibr" rid="B37">Dorrell et al., 2017</xref>) based on <italic>in silico</italic> targeting predictions. Where no clear targeting predictions could be obtained, proteins were identified based on BLAST similarity to orthologous chloroplast- or mitochondria-targeted proteins from other algal and stramenopile species (<xref ref-type="bibr" rid="B37">Dorrell et al., 2017</xref>; <xref ref-type="bibr" rid="B95">R&#x00ED;o B&#x00E1;rtulos et al., 2018</xref>). Disregarding 135 query proteins coded by organellar genomes in diatoms (<xref ref-type="bibr" rid="B119">Yu et al., 2018</xref>) and 17 query proteins encoded by nuclear genes with no PhaeoNet module assigned, the final set comprised of 372 unique proteins targeted to the chloroplast and/or mitochondrion, encoded by nuclear genes that belong to one of the 28 merged modules. The main metabolic pathways and complexes and quantitative pathway associations, are presented in <xref ref-type="supplementary-material" rid="TS3">Supplementary Table 3</xref>.</p>
<p>A complete list of <italic>P. tricornutum</italic> transcription factors (TF) was assembled from a previous dataset (<xref ref-type="bibr" rid="B93">Rayko et al., 2010</xref>) and an updated list specifically of aureochromes (<xref ref-type="bibr" rid="B9">Banerjee et al., 2016</xref>), which were mapped to the version 3 genome annotation by BLASTp analysis. A total of 188 candidates, from 18 TF families (HSF, Myb, Zn_finger_C2H2, bZIP, Zn_finger_CCCH, bHLH, Sigma-70, Zn_finger_TAZ, CBF/NF, E2F-DP, CSF, Aureochrome, TRF, CCAAT-binding, AP2-EREBP, TAF9, CXC, Homeobox) corresponded to genes assigned to a PhaeoNet merged module (<xref ref-type="fig" rid="F5">Figure 5</xref> and <xref ref-type="supplementary-material" rid="TS4">Supplementary Table 4</xref>). Given that the regulation of gene expression by transcription factors play a key role in the growth and progression of the cell cycle, the distribution within merged modules genes implicated in the cell cycle (cyclins) and in light perception events (e.g., phytochrome, cryptochrome) were additionally investigated, as well as genes implied in transcription and histone-related processes (<xref ref-type="fig" rid="F5">Figure 5</xref> and <xref ref-type="supplementary-material" rid="TS4">Supplementary Table 4</xref>; <xref ref-type="bibr" rid="B54">Huysman et al., 2013</xref>; <xref ref-type="bibr" rid="B4">Annunziata et al., 2019</xref>).</p>
</sec>
<sec id="S2.SS4">
<title>Phylogenetics</title>
<p>A tree of sigma factor proteins from <italic>P. tricornutum</italic> and orthologous diatom and non-diatom sequences was constructed using a pipeline adapted from previous studies (<xref ref-type="bibr" rid="B37">Dorrell et al., 2017</xref>; <xref ref-type="bibr" rid="B92">Rastogi et al., 2018</xref>). Briefly, the complete peptide sequences of each sigma factor protein (eight total) in the Phatr3 annotation of the <italic>P. tricornutum</italic> genome (<xref ref-type="bibr" rid="B92">Rastogi et al., 2018</xref>) were searched using BLASTp against a composite library consisting of 110 diatom genomes, MMETSP (Marine Microbial Eukaryote Transcriptome Sequencing Project, <xref ref-type="bibr" rid="B60">Keeling et al., 2014</xref>) and independent transcriptomes; and a reference set of 59 additional eukaryotic genomes, sampled from across the tree of life (<xref ref-type="supplementary-material" rid="TS5">Supplementary Table 5</xref>). Orthologs with an <italic>e</italic>-value of 10<sup>&#x2013;05</sup> or lower were extracted and searched against the complete protein sequences encoded within the Phatr3 annotation of the <italic>P. tricornutum</italic> genome via reciprocal BLASTp searches. Sequences which retrieved a single best hit against a <italic>P. tricornutum</italic> sigma factor protein were aligned using MAFFT v 8.0 (<xref ref-type="bibr" rid="B57">Katoh et al., 2002</xref>) under the &#x2013;auto setting (BLOSUM62 matrix, gap open penalty 1.53, offset value 0) and the in-house alignment program in GeneIOUS v 10.0.9 (<xref ref-type="bibr" rid="B59">Kearse et al., 2012</xref>) using a more stringent set of conditions (65% similarity cost matrix, gap open penalty 12, gap extension penalty 3, two rounds of refinement). Poorly aligned or incomplete sequences were removed at each step. The 771 protein sequences retained were manually curated to retain a representative series of 86 diatom and non-diatom sequences related to each <italic>P. tricornutum</italic> sigma factor and trimmed using trimal with the &#x2013;gt 0.5 setting (<xref ref-type="bibr" rid="B24">Capella-Guti&#x00E9;rrez et al., 2009</xref>) to yield a 453 aa alignment. The best-scoring tree topology was inferred from the alignment using RAxML v8.2, 100 bootstrap replicates and the PROTGAMMAJTT substitution model (<xref ref-type="bibr" rid="B105">Stamatakis, 2014</xref>); and MrBayes v3.2.7 over 600,000 generations, burnin fractions of 0.5 and the Jones amino acid substitution model (<xref ref-type="bibr" rid="B52">Huelsenbeck and Ronquist, 2001</xref>). Alignment and tree outputs are provided in <xref ref-type="supplementary-material" rid="TS5">Supplementary Table 5</xref>.</p>
</sec>
</sec>
<sec id="S3">
<title>Results and Discussion</title>
<sec id="S3.SS1">
<title>Construction of an Optimized WGCNA Gene Expression Dataset for <italic>P. tricornutum</italic></title>
<p>We harnessed 187 publically available RNAseq datasets derived from diverse physiological conditions and genotypes (<xref ref-type="bibr" rid="B30">Cruz de Carvalho et al., 2016</xref>; <xref ref-type="bibr" rid="B103">Smith et al., 2016</xref>; <xref ref-type="bibr" rid="B76">McCarthy et al., 2017</xref>) to build an integrative model of gene co-regulation for the model diatom species <italic>P. tricornutum</italic> (<xref ref-type="fig" rid="F1">Figure 1A</xref> and <xref ref-type="supplementary-material" rid="TS1">Supplementary Table 1</xref>, sheet 1). We chose to build a dataset focusing on one species only, as even closely related diatom species may contain very different protein orthogroups (<xref ref-type="bibr" rid="B90">Parks et al., 2018</xref>; <xref ref-type="bibr" rid="B97">Sato et al., 2020</xref>) and even orthologous proteins may perform different physiological functions between different diatom species, with presumably different co-regulatory dynamics (<xref ref-type="bibr" rid="B66">Lampe et al., 2018</xref>). <italic>P. tricornutum</italic> was selected as a model system for this study as vastly greater amounts of gene expression data have been generated for this species than any other marine alga (<xref ref-type="bibr" rid="B6">Ashworth and Ralph, 2018</xref>); and as its genome annotation (currently in third version form and verified by comparison to over forty RNAseq libraries generated under varied conditions, <xref ref-type="bibr" rid="B92">Rastogi et al., 2018</xref>) is arguably the most complete of any alga known, allowing unprecedented insight into protein diversity, including variant protein forms generated by alternative splicing, protein sub-cellular localization and epigenetic modifications. The use of RNAseq data for this analysis allows us to advance on previous (e.g., microarray-based, <xref ref-type="bibr" rid="B7">Ashworth et al., 2016</xref>) analyses by allowing us to consider absolute rather than relative changes in expression levels between different datasets, and therefore exclude distorting effects caused by low absolute levels of the expression of specific genes in the <italic>P. tricornutum</italic> genome.</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption><p>Construction and topology of PhaeoNet. <bold>(A)</bold> Workflow diagram of the steps performed to construct PhaeoNet. <bold>(B)</bold> A Multi-Dimensional Scaling (MDS) plot of PhaeoNet. The dots correspond to genes and the colors correspond to the WGCNA modules. The tips of the plot correspond to hub genes of PhaeoNet. <bold>(C)</bold> Heatmap plot showing the TOM supplemented by the WGCNA module colors prior to merging. <bold>(D)</bold> Gene dendrogram of all incorporated PhaeoNet genes, obtained by average linkage hierarchical clustering. The first color row underneath the dendrogram shows the WGCNA module assignment obtained by the Dynamic Tree Cut method. The bottom color row shows the merged modules based on a correlation threshold of 0.75.</p></caption>
<graphic xlink:href="fpls-11-590949-g001.tif"/>
</fig>
<p>We optimized our data through several key pre-processing steps, for example removing batch effects (<xref ref-type="supplementary-material" rid="FS1">Supplementary Figure 1A</xref>) and five samples showing strong outlier effects (exemplar shown in <xref ref-type="supplementary-material" rid="FS1">Supplementary Figure 1B</xref>) prior to network construction, retaining 182 datasets for the final network construction. We also excluded genes that were found to be lowly expressed (median expression &#x003C; 10 reads) in all inspected conditions, retaining 10,650/12,177 genes in the Phatr3 annotation (<xref ref-type="bibr" rid="B92">Rastogi et al., 2018</xref>) of the <italic>P. tricornutum</italic> genome (<xref ref-type="supplementary-material" rid="TS1">Supplementary Table 1</xref>, sheet 2). All pairwise gene correlations were calculated and then converted into connectivity strengths by raising their values to the power &#x03B2; = 12 for PhaeoNet. This power makes it possible to work in a scale-free condition and to avoid weak correlations (<xref ref-type="supplementary-material" rid="FS2">Supplementary Figure 2</xref>).</p>
<p>By applying the dynamic tree cut function on the dendrogram obtained by a hierarchical clustering with the method average, we identified 50 WGCNA modules with similar connection force profiles (<xref ref-type="fig" rid="F1">Figures 1B,C</xref>). This was reduced to a subset of 28 merged modules with internal correlations above 0.75 (<xref ref-type="fig" rid="F1">Figure 1D</xref>, <xref ref-type="supplementary-material" rid="TS1">Supplementary Table 1</xref>, sheet 2; and <xref ref-type="supplementary-material" rid="FS3">Supplementary Figure 3</xref>), in accordance with other WGCNA studies (<xref ref-type="bibr" rid="B67">Langfelder and Horvath, 2008</xref>; <xref ref-type="bibr" rid="B120">Zhao et al., 2010</xref>) and following validation by cross-referencing to independently derived gene co-regulation datasets for <italic>P. tricornutum</italic> (described below). The final version of PhaeoNet showed good overall cohesion within the merged modules, as inferrable by multi-dimensional-scaling projection (<xref ref-type="fig" rid="F1">Figure 1C</xref>) and correlation heatmaps of gene co-expression interconnectedness (<xref ref-type="fig" rid="F1">Figure 1B</xref>).</p>
<p>We present an exemplar merged module output (paleturquoise) in <xref ref-type="fig" rid="F2">Figure 2</xref>. A density heatmap, divided vertically by condition and horizontally by gene expression profile, shows a cohesive module as illustrated by stable values of first quantile, median, and third quantile values (<xref ref-type="fig" rid="F2">Figure 2A</xref>) and is defined by high levels of expression across the majority of the conditions explored (<xref ref-type="supplementary-material" rid="FS3">Supplementary Figure 3B</xref>). Cytoscape (<xref ref-type="bibr" rid="B100">Shannon et al., 2003</xref>) visualization of the network with a correlation threshold of 0.2 (<xref ref-type="fig" rid="F2">Figure 2B</xref>) demonstrates that the paleturquoise merged module is highly connected, showing a cluster of hub genes with high connectivity located in the central part of the network and only a small number of genes with limited connectivity. We provide detailed expression and Cytoscape data for each PhaeoNet merged module via <ext-link ext-link-type="uri" xlink:href="https://osf.io/42xmp">https://osf.io/42xmp</ext-link>.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption><p>Visualization and analysis of an exemplar PhaeoNet merged module (paleturquoise). <bold>(A)</bold> Density heatmap of all genes assigned to the paleturquoise merged module. The y-coordinate positions in the graph relate to density distribution of gene expression in each sample (shown on the left <italic>y</italic>-axis); the four middle dashed lines (indicated by horizontal arrows on either side of the graph) correspond to the median, first and third quantiles (shown on the right <italic>y</italic>-axis). The majority of the genes in this specific module show limited variation in expression profiles over different conditions samples. <bold>(B)</bold> A topological representation of connectedness within the paleturquoise merged module, visualized with Cytoscape (version 3.6.1). Each node represents a gene. Edges represent pairwise correlations between genes. The network shows all the paleturquoise module genes with a correlation value over a threshold of 0.20.</p></caption>
<graphic xlink:href="fpls-11-590949-g002.tif"/>
</fig>
</sec>
<sec id="S3.SS2">
<title>PhaeoNet Merged Modules Show Concordance With Microarray Co-regulation Data</title>
<p>We tested the reproducibility of our assignations, which may be considered as an independent measure of their robustness, by comparing the repartition of all <italic>P. tricornutum</italic> genes assigned to a PhaeoNet merged module with their corresponding distributions in 500 co-regulated clusters previously assembled from microarray data within the DiatomPortal server (<xref ref-type="bibr" rid="B7">Ashworth et al., 2016</xref>; <xref ref-type="supplementary-material" rid="FS4">Supplementary Figure 4A</xref> and <xref ref-type="supplementary-material" rid="TS2">Supplementary Table 2</xref>). Across 7,751 assessable genes with both PhaeoNet and DiatomPortal assignations, we identified 4,127 (53%) that occurred in the same PhaeoNet merged module as another gene with the same DiatomPortal cluster assignation; and 2,751 genes (35%) that occurred within the single PhaeoNet merged module incorporating the greatest number of genes from the same DiatomPortal cluster. Both of these frequencies were judged to be significantly greater than expected through a random distribution (<italic>P</italic> = 0, one-tailed chi-squared test), suggesting strong concordance between both datasets.</p>
<p>From the 461 (83%) DiatomPortal clusters for which we could identify corresponding PhaeoNet merged modules, 369 (80%) were preferentially distributed in one PhaeoNet merged module only, with the greatest number of clusters associated with the darkgray merged module (79 clusters), blue (46 clusters) and cyan (44 clusters) merged modules, reflecting the greater size of each merged module (<xref ref-type="supplementary-material" rid="FS4">Supplementary Figure 4A</xref> and <xref ref-type="supplementary-material" rid="TS2">Supplementary Table 2</xref>). No DiatomPortal clusters were found to be incorporated preferentially into the bisque4, darkmagenta, greenyellow, gray, lightsteelblue1 and mediumpurple3 PhaeoNet merged modules. It is possible that these merged modules represent transcriptional networks not visualized within DiatomPortal due to the different source datasets, generated using different techniques (e.g., microarray versus RNAseq data, assembled with hierarchical clustering versus WGCNA; <xref ref-type="bibr" rid="B7">Ashworth et al., 2016</xref>), which may influence what genes are inferred to be coexpressed using each analysis.</p>
<p>We also verified the number of associations independently found between pairs of genes in DiatomPortal clusters and PhaeoNet modules generated with independent merging thresholds, as an independent test of the appropriateness of our selected 0.75 merging threshold (<xref ref-type="supplementary-material" rid="FS4">Supplementary Figure 4B</xref>). We found greater concordance between DiatomPortal and PhaeoNet modules generated with a 0.75 merging threshold, as in our methodology, than in unmerged WGCNA modules, or modules merged with higher (0.8) or lower (0.7) threshold values (<xref ref-type="supplementary-material" rid="FS4">Supplementary Figure 4B</xref>).</p>
</sec>
<sec id="S3.SS3">
<title>Different PhaeoNet Merged Modules Perform Different Biological Activities in the <italic>P. tricornutum</italic> Cell</title>
<p>Next, we profiled the predominant biological activities associated with each merged module by calculating enrichment scores for different functional, subcellular targeting and evolutionary annotations across the <italic>P. tricornutum</italic> genome (<xref ref-type="bibr" rid="B92">Rastogi et al., 2018</xref>; <xref ref-type="fig" rid="F3">Figure 3</xref> and <xref ref-type="supplementary-material" rid="FS5">Supplementary Figure 5</xref>). A full set of protein annotations <italic>P. tricornutum</italic>, including PhaeoNet module assignations, inferred functions, predicted localization and inferred evolutionary origin, is provided for user exploration in <xref ref-type="supplementary-material" rid="TS2">Supplementary Table 2</xref>.</p>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption><p>Biological properties associated with PhaeoNet merged modules. This Figure provides an overview of enrichments of different organelle targeting (<xref ref-type="bibr" rid="B51">Horton et al., 2007</xref>; <xref ref-type="bibr" rid="B47">Gschloessl et al., 2008</xref>; <xref ref-type="bibr" rid="B41">Fukasawa et al., 2015</xref>; <xref ref-type="bibr" rid="B46">Gruber et al., 2015</xref>), epigenetic (<xref ref-type="bibr" rid="B113">Veluchamy et al., 2013</xref>, <xref ref-type="bibr" rid="B114">2015</xref>; <xref ref-type="bibr" rid="B121">Zhao et al., 2020</xref>), evolutionary (<xref ref-type="bibr" rid="B92">Rastogi et al., 2018</xref>) and KEGG pathway annotations (<xref ref-type="bibr" rid="B55">Kanehisa, 2017</xref>) enriched in merged modules. The first seven (shaded) columns provide a score for different conditions, aggregated from chi-squared P-values of multiple enrichment predictors (defined beneath): enrichments in each condition carry a score of +1 if significant to <italic>P</italic> &#x003C; 0.05 and +2 if significant to <italic>P</italic> &#x003C; 10<sup>&#x2013;05</sup>; and depletions in each condition carry a score of &#x2013;1 if significant to <italic>P</italic> &#x003C; 0.05 and &#x2013;2 if significant to <italic>P</italic> &#x003C; 10<sup>&#x2013;05</sup>, assessed by chi-squared test against a null hypothesis of a random distribution of these features across all genes assigned to a PhaeoNet merged module. The final column lists all metabolic pathways enriched to <italic>P</italic> &#x003C; 0.05, or <italic>P</italic> &#x003C; 10<sup>&#x2013;05</sup> (asterisked) for each merged module, assessed by chi-squared test as above. Verbose outputs for each set of conditions are provided in <xref ref-type="supplementary-material" rid="FS5">Supplementary Figure 5</xref>. Additional annotations, e.g., enrichments in inferred evolutionary origins of each merged module, are provided for user exploration in <xref ref-type="supplementary-material" rid="TS2">Supplementary Table S2</xref>.</p></caption>
<graphic xlink:href="fpls-11-590949-g003.tif"/>
</fig>
<p>We identified seven major subsets of merged modules with different biological properties. The first subset consists of merged modules (blue, lightcyan1, lightsteelblue1 and salmon) associated with the chloroplast [either genes encoding chloroplast-targeted proteins, inferred with ASAFind (<xref ref-type="bibr" rid="B46">Gruber et al., 2015</xref>) or HECTAR (<xref ref-type="bibr" rid="B47">Gschloessl et al., 2008</xref>), or of inferred red algal origin in a previous BLAST top hit analysis of the <italic>P. tricornutum</italic> genome (<xref ref-type="bibr" rid="B92">Rastogi et al., 2018</xref>)]. We included proteins of red algal origin as an independent estimator of chloroplastic origin, as the vast majority of red algal protein in <italic>P. tricornutum</italic> likely derive from the diatom chloroplast endosymbiont (<xref ref-type="bibr" rid="B37">Dorrell et al., 2017</xref>) and to allow us to detect chloroplast-associated proteins that elude <italic>in silico</italic> targeting prediction (<xref ref-type="bibr" rid="B82">Nonoyama et al., 2019</xref>; <xref ref-type="bibr" rid="B98">Schober et al., 2019</xref>). These merged modules were also enriched (as inferred with KEGG analysis (<xref ref-type="bibr" rid="B55">Kanehisa, 2017</xref>) in genes related to photosynthesis, carbon-fixation and core biosynthetic pathways (e.g., amino acid and pigment biosynthesis) associated with diatom chloroplasts (<xref ref-type="fig" rid="F3">Figure 3</xref> and <xref ref-type="supplementary-material" rid="FS5">Supplementary Figure 5</xref>; <xref ref-type="bibr" rid="B82">Nonoyama et al., 2019</xref>). Nearly all of the merged modules within this subset were enriched in activating histone marks (e.g., H3K9Ac and H3K14Ac) and depleted in repressive marks (e.g., H3K9me2 and H3K27me3) in cultures grown under replete media conditions (<xref ref-type="fig" rid="F3">Figure 3</xref> and <xref ref-type="supplementary-material" rid="FS5">Supplementary Figure 5</xref>; <xref ref-type="bibr" rid="B114">Veluchamy et al., 2015</xref>; <xref ref-type="bibr" rid="B121">Zhao et al., 2020</xref>), consistent with high levels of expression. Each of the chloroplast-enriched modules contained enrichments in different KEGG functions (discussed below), although only one of these modules (blue) was enriched in proteins containing at least one KEGG annotation (<xref ref-type="supplementary-material" rid="FS5">Supplementary Figure 5</xref>); and, in any case, all merged modules contain substantial numbers (between 18%, bisque4; and 54%, violet).</p>
<p>A second parallel set of merged modules (floralwhite, magenta, mediumpurple3, and orangered4), which was also found to be enriched in activating histone marks, was enriched in genes encoding mitochondria-targeted proteins (inferred with MitoFates, HECTAR and WolfPSort (<xref ref-type="bibr" rid="B51">Horton et al., 2007</xref>; <xref ref-type="bibr" rid="B47">Gschloessl et al., 2008</xref>; <xref ref-type="bibr" rid="B41">Fukasawa et al., 2015</xref>) and mitochondria-associated functions (e.g., oxidative phosphorylation and pyruvate metabolism; <xref ref-type="fig" rid="F3">Figure 3</xref> and <xref ref-type="supplementary-material" rid="FS5">Supplementary Figure 5</xref>). Of note, the paleturquoise merged module was uniquely enriched in genes encoding both chloroplast and mitochondria-targeted proteins, suggesting a probable hub between both organelle functions (<xref ref-type="fig" rid="F3">Figure 3</xref>).</p>
<p>We identified three further subsets of merged modules that were enriched in cytoplasmic or nuclear processes involved in metabolism (black, cyan, orange, and tan); genome-associated processes including transcription, translation and genome repair (bisque4, steelblue, ivory and violet); or cellular processes including protein modification, protein trafficking and the cell cycle (brown4, darkgray, and red; <xref ref-type="fig" rid="F3">Figure 3</xref> and <xref ref-type="supplementary-material" rid="FS5">Supplementary Figure 5</xref>). Certain merged modules contained a mixture of genes encoding both metabolic and non-metabolic proteins: amongst other examples, the steelblue merged module was found to be enriched both in genes encoding proteins associated with ribosome and tRNA biogenesis and also in genes encoding enzymes involved in purine and pyrimidine metabolism, suggesting a probable transcriptional coordination of nucleotide biosynthesis to translational activity in <italic>P. tricornutum</italic> cells (<xref ref-type="fig" rid="F3">Figure 3</xref> and <xref ref-type="supplementary-material" rid="FS5">Supplementary Figure 5</xref>). A sixth subset of merged modules (darkgreen, darkmagenta and darkslateblue) showed no obvious enrichment in any KEGG function or organelle localization, except for a possible enrichment in peroxisomal functions in the darkgreen merged module (<xref ref-type="bibr" rid="B32">Davis et al., 2017</xref>).</p>
<p>The final merged module subset (brown, green, greenyellow, gray, and skyblue) was uniquely enriched in repressive histone marks and depleted in activating histone marks, in cultures grown on replete media (<xref ref-type="fig" rid="F3">Figure 3</xref>; <xref ref-type="bibr" rid="B114">Veluchamy et al., 2015</xref>). These merged modules may either be constitutively repressed in <italic>P. tricornutum</italic> cells, or might lose their repressive histone marks and be expressed in alternative conditions to the replete culture conditions in which the epigenetic datasets were collected (<xref ref-type="bibr" rid="B121">Zhao et al., 2020</xref>). We noted that the greenyellow merged module, for example, was enriched in proteins with at least one KEGG annotation; and the skyblue merged module was found to be significantly enriched in genes encoding proteins involved in carbon fixation, the TCA cycle and propionate metabolism (<xref ref-type="fig" rid="F3">Figure 3</xref> and <xref ref-type="supplementary-material" rid="FS5">Supplementary Figure 5</xref>). Further studies of the epigenetic marks associated with these modules, including under physiological conditions in which they are most highly expressed (<xref ref-type="supplementary-material" rid="FS3">Supplementary Figure 3</xref>) will be necessary to determine under what circumstances the genes they contain make significant contributions to <italic>P. tricornutum</italic> biology.</p>
</sec>
<sec id="S3.SS4">
<title>PhaeoNet Merged Modules Reveal Transcriptional Co-regulation in <italic>P. tricornutum</italic> Chloroplast and Mitochondrial Metabolism</title>
<p>Having noticed specific biases in the distribution of mitochondria- and chloroplast-targeted proteins within our dataset and given the distinctive organelle metabolism noted in diatoms compared to plants (<xref ref-type="bibr" rid="B63">Kroth et al., 2008</xref>; <xref ref-type="bibr" rid="B82">Nonoyama et al., 2019</xref>; <xref ref-type="bibr" rid="B102">Smith et al., 2019</xref>), we wished to identify which key chloroplast and mitochondrial functions are revealed by PhaeoNet to be transcriptionally coordinated with one another. We searched the distribution of 372 manually curated nuclear-encoded proteins with known chloroplast- and mitochondria-associated functions and localizations (<xref ref-type="fig" rid="F4">Figure 4</xref>, <xref ref-type="supplementary-material" rid="FS6">Supplementary Figure 6</xref>, and <xref ref-type="supplementary-material" rid="TS3">Supplementary Table 3</xref>). At least one gene encoding one such protein of each merged module was present in this set, however, only 12 merged modules contained more than 10 genes and amounted to 83% of the set.</p>
<fig id="F4" position="float">
<label>FIGURE 4</label>
<caption><p>Main metabolic pathways and functional complexes of <italic>P. tricornutum</italic> plastid <bold>(left)</bold> and mitochondrion <bold>(right)</bold> and their composition in regard to PhaeoNet merged modules. Each square represents a gene encoding a protein identified either from N-terminal targeting predictions to function in the chloroplast or mitochondrion. Clusters of adjacent squares pertain to genes encoding different components of a specific multi-unit enzyme or complex; and split squares pertain to genes encoding functional homologs of one specific protein. The assigned merged modules are indicated as their respective colors, with the 16 most abundant merged modules shown in the legend. Additionally, proteins coded in organellar genomes (<xref ref-type="bibr" rid="B88">Oudot-Le Secq et al., 2007</xref>; <xref ref-type="bibr" rid="B87">Oudot-Le Secq and Green, 2011</xref>; <xref ref-type="bibr" rid="B119">Yu et al., 2018</xref>) are shown as dotted green or red; proteins for which chloroplast- or mitochondria-targeted isoforms or merged modules could not be assigned are shown as light gray; and enzymatic steps not identified in the genome are shown as light gray squares without borders. Dual-localized proteins (<xref ref-type="bibr" rid="B43">Gile et al., 2015</xref>; <xref ref-type="bibr" rid="B37">Dorrell et al., 2017</xref>) are marked by checkered yellow boxes; while orange boxes highlight potential connection points between the two organelles. Abbreviations are as follows: CAs, carbonic anhydrases; MEP/DOXP, mevalonate and non-mevalonate pathways for isoprenoid biosynthesis; SUF, iron-sulfur complex assembly; MPP,/TPP/SPP, mitochondrial, thylakoid and stromal processing peptidases; TAT, twin-arginine-dependent thylakoid protein import pathways; AOX/PTOX, mitochondrial and chloroplast alternative oxidases; TCA, Citric Acid cycle; Orn, ornithine; GCS, glycine shuttle; GS-GOGAT, glutamine synthetase/glutamate synthase shuttle. Detailed enzyme distributions for each pathway are shown in <xref ref-type="supplementary-material" rid="FS6">Supplementary Figure 6</xref>.</p></caption>
<graphic xlink:href="fpls-11-590949-g004.tif"/>
</fig>
<p>The most abundantly represented merged module (blue, 69 chloroplast or mitochondrial occurrences) was clearly associated with genes encoding chloroplast anabolic reactions, containing enzymes associated with the Calvin&#x2013;Benson&#x2013;Bassham (CBB) cycle, chloroplast-targeted glycolysis/gluconeogenesis (<xref ref-type="bibr" rid="B63">Kroth et al., 2008</xref>) and fatty acid synthesis (<xref ref-type="bibr" rid="B74">Mar&#x00E9;chal and Lupette, 2020</xref>), along with theta-class carbonic anhydrases that mediate biophysical carbon concentrating mechanisms in diatom chloroplasts (<xref ref-type="fig" rid="F4">Figure 4</xref> and <xref ref-type="supplementary-material" rid="FS6">Supplementary Figure 6</xref>; <xref ref-type="bibr" rid="B61">Kikutani et al., 2016</xref>; <xref ref-type="bibr" rid="B82">Nonoyama et al., 2019</xref>). The blue merged module additionally contained genes encoding chloroplast-targeted proteins implicated in photoprotection, including the diatom xanthophyll cycle (e.g., Phatr3_J51703 encoding violaxanthin de-epoxidase; <xref ref-type="bibr" rid="B40">Frommolt et al., 2008</xref>; <xref ref-type="bibr" rid="B31">Dautermann and Lohr, 2017</xref>), tocopherol synthesis (e.g., Phatr3_J20470, encoding tocopherol cyclase; <xref ref-type="bibr" rid="B33">D&#x0142;u&#x017C;ewska et al., 2016</xref>; <xref ref-type="bibr" rid="B82">Nonoyama et al., 2019</xref>) and two genes (Phatr3_J27278 and Phatr3_J44733) encoding LhcX-class chlorophyll-binding proteins, associated with high- and low-light adaptation responses in diatoms (<xref ref-type="supplementary-material" rid="TS2">Supplementary Tables 2</xref>, <xref ref-type="supplementary-material" rid="TS3">3</xref>; <xref ref-type="bibr" rid="B106">Taddei et al., 2016</xref>; <xref ref-type="bibr" rid="B23">Buck et al., 2019</xref>).</p>
<p>Genes encoding photosynthetic metabolism enzymes were concentrated in the lightcyan1 (41 occurrences) and lightsteelblue1 merged modules (19 occurrences). The lightcyan1 merged module included genes encoding LhcF-, LhcR-, and chlorophyll a/b-binding proteins, which are typically considered not to be involved in light stress responses (<xref ref-type="bibr" rid="B49">Gundermann et al., 2013</xref>; <xref ref-type="bibr" rid="B22">B&#x00FC;chel, 2015</xref>) and nucleus-encoded subunits of photosystems I, II and cytochrome c<sub>6</sub> (<xref ref-type="bibr" rid="B45">Grouneva et al., 2011</xref>; <xref ref-type="bibr" rid="B96">Roncel et al., 2016</xref>); whereas the lightsteeblue1 merged module contained the majority of genes involved in diatom chlorophyll and isoprenoid synthesis (<xref ref-type="bibr" rid="B15">Bertrand, 2010</xref>; <xref ref-type="bibr" rid="B29">Cihlar et al., 2016</xref>). We noted the presence of two genes encoding enzymes involved in pigment biosynthesis, respectively carotenoids (Phatr3_J21829, encoding 2-C-methyl-D-erythritol 4-phosphate cytidylyltransferase) and chlorophyll (Phatr3_J30690, encoding 3,8-divinyl protochlorophyllide-a 8-vinyl reductase (<xref ref-type="bibr" rid="B116">Wang et al., 2010</xref>) in the lightcyan1 merged module (<xref ref-type="supplementary-material" rid="FS6">Supplementary Figure 6</xref>). We also noted the presence of the gene Phatr3_J47674 encoding the iron stress-induced protein ISIP3 within the lightcyan1 merged module, which may point to a functional role for this protein in chloroplast photosystem assembly (<xref ref-type="supplementary-material" rid="FS6">Supplementary Figure 6</xref>; <xref ref-type="bibr" rid="B2">Allen et al., 2008</xref>; <xref ref-type="bibr" rid="B26">Chappell et al., 2015</xref>).</p>
<p>Genes encoding mitochondrial respiratory chain proteins were concentrated toward the orangered4 merged module (27 occurrences), whereas, genes encoding TCA cycle enzymes were concentrated toward the cyan merged module (34 occurrences). The orangered4 merged module also contained large numbers of genes encoding mitochondrial ribosomal proteins, which may relate to redox-state dependent regulation of mitochondrial biogenesis pathways (<xref ref-type="bibr" rid="B3">Allen, 2003</xref>). In contrast, most genes encoding chloroplast biogenesis-related proteins were identified in separate PhaeoNet merged modules to genes encoding proteins of the photosystem core, with significant enrichments of genes encoding chloroplast ribosomal proteins in the ivory merged module (otherwise enriched in chloroplast branched-chain amino acid and lysine biosynthesis (<xref ref-type="bibr" rid="B21">Bromke, 2013</xref>). It remains to be determined to what extent the expression of the chloroplast- and mitochondrial-genomes of <italic>P. tricornutum</italic> are regulated in response to the redox state, versus metabolic fluxes experienced in both organelles.</p>
<p>Finally, we considered the repartition of functionally uncharacterized, but conserved domains across chloroplast-targeted proteins in our dataset, focusing on DUFs (Domains of Unknown Function). We found 30 chloroplast-targeted proteins containing at least one DUF and 8 DUFs assigned to at least two chloroplast-targeted proteins (<xref ref-type="supplementary-material" rid="TS3">Supplementary Table 3</xref>, Sheet 2). Amongst these recurrent chloroplast-associated DUFs were two examples (DUF1995 and DUF3493), which have previously been implicated to function in photosystem assembly within thylakoid membranes (<xref ref-type="bibr" rid="B28">Chi et al., 2012</xref>; <xref ref-type="bibr" rid="B17">Bohne et al., 2016</xref>; <xref ref-type="bibr" rid="B69">Li et al., 2019</xref>). Both of these DUFs were found amongst chloroplast-targeted proteins in the paleturquoise merged module (Phatr3_J38149, Phatr3_J40136, and Phatr3_J46926, containing DUF1995; and Phatr3_EG02444, containing DUF3493); in the blue module (Phatr3_J44212, containing DUF1995; and Phatr3_J45569, containing DUF3494); and DUF1995 furthermore occurred in chloroplast-targeted proteins in the lightcyan1 (Phatr3_J44529) and lightsteelblue (Phatr3_J40199) modules (<xref ref-type="supplementary-material" rid="TS3">Supplementary Table 3</xref>, Sheet 2). Each of these modules are enriched in different chloroplast-targeted metabolism pathways (<xref ref-type="fig" rid="F3">Figures 3</xref>, <xref ref-type="fig" rid="F4">4</xref>), suggesting complex connections between the regulation of chloroplast anabolism and photosystem assembly.</p>
<p>Amongst the other DUFs associated with more than one chloroplast-targeted protein were DUF814, which is implicated in RNA quality control and amongst <italic>P. tricornutum</italic> chloroplast-targeted protein includes one (Phatr3_J45207, within the paleturquoise module) with some structural homology to a ferrous iron transporter (<xref ref-type="bibr" rid="B75">Maxwell Burroughs and Aravind, 2014</xref>); and DUF563, which contains a carbohydrate-active domain (<xref ref-type="bibr" rid="B89">Park et al., 2010</xref>) and includes at least one chloroplast-targeted protein (Phatr3_EG00581) within the blue module, otherwise implicated in chloroplast carbon metabolism (<xref ref-type="fig" rid="F3">Figures 3</xref>, <xref ref-type="fig" rid="F4">4</xref>). It remains to be determined if either of these proteins has novel functions, e.g., respectively in iron status sensing or in the diversification of carbohydrate metabolism in the <italic>P. tricornutum</italic> chloroplast, via the generating and phenotyping of mutant lines.</p>
</sec>
<sec id="S3.SS5">
<title>PhaeoNet Merged Modules Identify Complex Crosstalk between the Chloroplast and Mitochondrion in <italic>P. tricornutum</italic></title>
<p>Previously, intricate metabolic connections have been observed between <italic>P. tricornutum</italic> chloroplasts and mitochondria, which are distinctive to those found in plants (<xref ref-type="bibr" rid="B91">Prihoda et al., 2012</xref>; <xref ref-type="bibr" rid="B8">Bailleul et al., 2015</xref>; <xref ref-type="bibr" rid="B20">Broddrick et al., 2019</xref>; <xref ref-type="bibr" rid="B81">Murik et al., 2019</xref>). We wished to determine which of these connections were visible within our data, noting multiple, transcriptionally independent connections between the predicted proteomes of chloroplasts and mitochondria in PhaeoNet data (highlighted in <xref ref-type="supplementary-material" rid="FS6">Supplementary Figure 6</xref>). These included the presence of genes encoding chloroplast-targeted protein import subunits (e.g., Phatr3_J32195 encoding Tic20, Phatr3_EG02421 encoding Tic21) within the otherwise predominantly mitochondrial orangered4 merged module and the presence of large numbers of amino-acyl tRNA synthetase genes (which are typically dual-targeted to the chloroplasts and mitochondria in diatoms (<xref ref-type="bibr" rid="B43">Gile et al., 2015</xref>; <xref ref-type="bibr" rid="B37">Dorrell et al., 2017</xref>, <xref ref-type="bibr" rid="B35">2019</xref>) in the otherwise chloroplast-associated blue merged module.</p>
<p>We furthermore noted the presence of multiple chloroplast-targeted proteins associated with chloroplast division (e.g., Phatr3_J34093, Phatr3_J42361, and Phatr3_J14995, encoding FtsZ-type division proteins) in the blue module, potentially linking the synthesis of chloroplast and mitochondrial tRNAs to chloroplast replication. A further two proteins implicated in chloroplast replication (e.g., Phatr3_J21455, encoding a dynamin-related DRPB85-class protein and Phatr3_J14426, encoding a further FtsZ protein)&#x2014;were found in the darkgray module, which was also populated by proteins involved in mitochondrial protein import (MPP, TIM, OXA1; <xref ref-type="supplementary-material" rid="TS3">Supplementary Table 3</xref>), suggesting probable links between chloroplast and mitochondrial biogenesis. Of note, at least two of the FtsZ proteins (Phatr3_J34093, within the blue module and Phatr3_J14426, within the darkgray module) were inferred to possess both chloroplast and mitochondrial-targeting sequences, underpinning the likely coordination of biogenesis of both organelles (<xref ref-type="supplementary-material" rid="TS3">Supplementary Table 3</xref>). This coordination may underpin the close topological associations and synchronized division cycles observed between the <italic>P. tricornutum</italic> mitochondrion and chloroplast observed <italic>in vivo</italic> (<xref ref-type="bibr" rid="B108">Tanaka et al., 2015</xref>; <xref ref-type="bibr" rid="B36">Dorrell and Bowler, 2017</xref>).</p>
<p>Alongside these more general links, we identified specific points of co-regulation between each organelle. The paleturquoise merged module, as the only merged module found to be enriched in both chloroplast and mitochondria functions (<xref ref-type="fig" rid="F3">Figure 3</xref>) was of particular interest and contained genes encoding enzymes participating in several different chloroplast and mitochondria metabolic pathways. These included genes for mitochondria-targeted glycine dehydrogenase (Phatr3_J22187) and serine hydroxymethyltransferase (Phatr3_J32847) and a gene for a chloroplast-targeted dihydrolipoamide dehydrogenase (Phatr3_J30113), which participate (as part of the glycine shuttle) in metabolic recycling of 2-P-glycolate produced through photosynthesis (<xref ref-type="supplementary-material" rid="FS6">Supplementary Figure 6</xref>; <xref ref-type="bibr" rid="B122">Zheng et al., 2013</xref>; <xref ref-type="bibr" rid="B32">Davis et al., 2017</xref>). The paleturquoise merged module additionally contains a gene encoding mitochondria-targeted malate dehydrogenase (Phatr3_J54082), which may additionally participate in the photorespiratory metabolism of glycolate by allowing the recycling of mitochondrial serine (via pyruvate) in the TCA cycle (<xref ref-type="bibr" rid="B32">Davis et al., 2017</xref>; <xref ref-type="bibr" rid="B20">Broddrick et al., 2019</xref>). Genes encoding at least three further plastidial oxidative stress-related proteins (Phatr3_J12583, encoding Fe-Mn family superoxide dismutase; Phatr3_J45252, encoding a plastidial thioredoxin; and Phatr3_J31436, encoding a plastidial ortholog of peroxisomal membrane protein 2, <xref ref-type="bibr" rid="B32">Davis et al., 2017</xref>; <xref ref-type="bibr" rid="B37">Dorrell et al., 2017</xref>) belong to the paleturquoise merged module, underlining its importance in oxidative stress responses.</p>
<p>Genes encoding both glutamine synthase (GS) and glutamate synthase/glutamine oxoglutarate aminotransferase (GOGAT), which have distinct plastidial and mitochondrial homologs in <italic>P. tricornutum</italic> (<xref ref-type="bibr" rid="B20">Broddrick et al., 2019</xref>; <xref ref-type="bibr" rid="B102">Smith et al., 2019</xref>), belong to different PhaeoNet merged modules (cyan, tan, steelblue and magenta), suggesting a relatively complex regulation of this hub. The plastid-localized GS (encoded by Phatr3_J51092) belongs to the magenta merged module, which also contains the subsequent genes encoding enzymes mediating the entry of GS-produced NH<sub>3</sub> into the mitochondrial ornithine-urea cycle (Phatr3_J42398 encoding malate dehydrogenase; Phatr3_J30145 encoding citrate synthase; Phatr3_J22913 encoding pyruvate kinase), suggesting this co-regulated pathway may have roles in recycling excess NH<sub>3</sub> produced in the chloroplast, in accordance with previous studies (<xref ref-type="bibr" rid="B68">Levering et al., 2016</xref>; <xref ref-type="bibr" rid="B20">Broddrick et al., 2019</xref>; <xref ref-type="bibr" rid="B102">Smith et al., 2019</xref>).</p>
<p>Finally, we noted the presence of genes encoding chloroplast-targeted plastoquinol terminal oxidase (Phatr3_J4283) and mitochondria-targeted alternative oxidase (Phatr3_EG02359), which are both associated with the photoprotective removal of excess metabolic reducing potential in the skyblue merged module (<xref ref-type="bibr" rid="B8">Bailleul et al., 2015</xref>; <xref ref-type="bibr" rid="B81">Murik et al., 2019</xref>). This merged module, as discussed above, contains genes encoding three successive enzymes associated with the TCA cycle (Phatr3_J40430 encoding &#x03B1;-ketoglutaryl dehydrogenase; Phatr3_J42015 encoding succinyl-CoA synthetase and Phatr3_J41812 encoding succinate dehydrogenase; <xref ref-type="bibr" rid="B63">Kroth et al., 2008</xref>), along with methylmalonyl-CoA mutase (Phatr3_J51830), which may allow excess succinyl-CoA to be diverted into lipid synthesis via propionyl-CoA (<xref ref-type="bibr" rid="B50">Helliwell et al., 2011</xref>; <xref ref-type="bibr" rid="B111">Valenzuela et al., 2012</xref>). This co-regulation underlines the importance of the succinate hub, and presumably both the glyoxylate cycle and ornithine shunt (as sources of mitochondrial &#x03B1;-ketoglutarate), as routes for the mitochondrial dissipation of excess chloroplast reducing potential (<xref ref-type="bibr" rid="B8">Bailleul et al., 2015</xref>; <xref ref-type="bibr" rid="B20">Broddrick et al., 2019</xref>).</p>
</sec>
<sec id="S3.SS6">
<title>Transcriptional Regulators of Chloroplast-Targeted Proteins Show Separate Expression Dynamics, Informed by Evolutionary History</title>
<p>Finally, given the complex transcriptional partitioning of genes encoding components of chloroplast and mitochondrial metabolism pathways across PhaeoNet data, we investigated what transcriptional drivers might be implicated in the co-regulation of different metabolism-enriched pathway clusters. First, we considered the repartition of a manually curated list of genes encoding proteins implied in histone and transcription-related processes (including transcription factors, TFs; <xref ref-type="bibr" rid="B93">Rayko et al., 2010</xref>; <xref ref-type="bibr" rid="B9">Banerjee et al., 2016</xref>) across all merged modules (<xref ref-type="supplementary-material" rid="FS7">Supplementary Figure 7</xref> and <xref ref-type="supplementary-material" rid="TS4">Supplementary Table 4</xref>). These genes were most frequently observed (&#x003E;5% of total merged module genes) in the darkgray, brown and steelblue merged modules (<xref ref-type="supplementary-material" rid="FS7">Supplementary Figure 7</xref> and <xref ref-type="fig" rid="F3">Figure 3</xref>). The brown and darkgray merged modules were additionally enriched in KEGG merged modules related to cytoskeleton proteins (<xref ref-type="supplementary-material" rid="FS4">Supplementary Figure 4</xref>), pointing to close links between cytoskeletal organization and transcriptional regulation in diatoms (for example, within organization of the cell cycle (<xref ref-type="bibr" rid="B54">Huysman et al., 2013</xref>; <xref ref-type="bibr" rid="B108">Tanaka et al., 2015</xref>). The single most abundant TF family, heat shock factor family (HSF) proteins (<xref ref-type="bibr" rid="B93">Rayko et al., 2010</xref>), were most frequently detected in the brown, brown4, cyan and skyblue merged modules (&#x003E; 5 HSFs each, <xref ref-type="supplementary-material" rid="FS7">Supplementary Figure 7</xref>). Notably, both the brown and brown4 merged modules are also enriched in KEGG functions associated with stress responses (protein ubiquitinylation, autophagy and membrane trafficking) (<xref ref-type="supplementary-material" rid="FS5">Supplementary Figure 5</xref>), consistent with previously inferred functions of specific <italic>P. tricornutum</italic> HSFs in the maintenance of cellular fitness (<xref ref-type="bibr" rid="B27">Chen et al., 2014</xref>; <xref ref-type="bibr" rid="B38">Egue et al., 2015</xref>).</p>
<p>We also found specific repartitions of genes encoding proteins implicated in light- and circadian-dependent transcriptional responses in <italic>P. tricornutum</italic>, e.g., aureochromes and cryptochromes (<xref ref-type="bibr" rid="B107">Takahashi et al., 2007</xref>; <xref ref-type="bibr" rid="B9">Banerjee et al., 2016</xref>). These proteins typically have cytoplasmic localizations, but through the perception of light and translocation to the nucleus can regulate the expression of core chloroplast metabolic pathways (<xref ref-type="bibr" rid="B64">Kroth et al., 2017</xref>). The circadian-regulated Aureochrome 1c (Phatr3_J12346; <xref ref-type="bibr" rid="B9">Banerjee et al., 2016</xref>; <xref ref-type="bibr" rid="B64">Kroth et al., 2017</xref>) and a cryptochrome-like blue light receptor (Phatr3_J34592) were both found in the blue merged module, implicated in anabolic metabolism; and the light-regulated Aureochrome 1b (Phatr3_J15977) and the blue-light-dependent protochlorophyllide reductase 1 (Phatr3_J12155; <xref ref-type="bibr" rid="B53">Hunsperger et al., 2016</xref>; <xref ref-type="bibr" rid="B73">Mann et al., 2017</xref>) were both found in the lightsteelblue1 merged module, alongside the majority of genes encoding other pigment biosynthesis enzymes. In contrast, the gene encoding Aureochrome 1a (Phatr3_J49116), which is essential for high light acclimation but appears to be under exclusively circadian (light-independent) regulation, falls within the lightcyan1 merged module of core photosystem-associated genes (<xref ref-type="supplementary-material" rid="TS4">Supplementary Table 4</xref> and <xref ref-type="supplementary-material" rid="FS7">Supplementary Figure 7</xref>; <xref ref-type="bibr" rid="B9">Banerjee et al., 2016</xref>; <xref ref-type="bibr" rid="B73">Mann et al., 2017</xref>); while RITMO1 (Phatr3_J44962), associated with the <italic>P. tricornutum</italic> circadian clock, falls within the skyblue merged module, which contains limited chloroplast-related functions except for alternative electron flow pathways (<xref ref-type="supplementary-material" rid="TS4">Supplementary Table 4</xref> and <xref ref-type="supplementary-material" rid="FS7">Supplementary Figure 7</xref>; <xref ref-type="bibr" rid="B4">Annunziata et al., 2019</xref>). The separate distributions of light- and circadian-regulated chloroplast regulators might reflect a circadian-entrained synthesis of the core photosynthetic machinery (via Aureochrome 1a), independent of light status, with chloroplast biosynthesis pathways upregulated both by circadian signaling (via Aureochrome 1c) and as a function of light availability (via Aureochrome 1b). This is reminiscent of circadian gene expression patterns visualized in plant and other algal lineages (e.g., the green alga <italic>Ostreococcus</italic> and the dinoflagellate <italic>Lingulodinium</italic>), in which photosynthesis and plastid biogenesis proteins are either expressed at separate times of the day, or show different regulatory responses to circadian and light signals (<xref ref-type="bibr" rid="B117">Wang et al., 2005</xref>; <xref ref-type="bibr" rid="B78">Monnier et al., 2010</xref>; <xref ref-type="bibr" rid="B83">Noordally et al., 2013</xref>). Finally, the gene encoding the Aureochrome 2 protein (Phatr3_J8113), which lacks the conserved flavin-binding domain required for light perception (<xref ref-type="bibr" rid="B107">Takahashi et al., 2007</xref>; <xref ref-type="bibr" rid="B64">Kroth et al., 2017</xref>), falls within the greenyellow merged module of generally transcriptionally repressed proteins (<xref ref-type="fig" rid="F3">Figure 3</xref>), underlining its independence of chloroplast functions.</p>
<p>Finally, we wished to consider within our dataset what transcriptional dynamics within the nuclear genome may underpin chloroplast gene expression in <italic>P. tricornutum.</italic> Chloroplast transcription in <italic>P. tricornutum</italic>, as in other diatoms, is performed by a plastid-encoded RNA polymerase, unlike the situation in plants in which both plastid- and nuclear-encoded and plastid-targeted polymerases participate (<xref ref-type="bibr" rid="B88">Oudot-Le Secq et al., 2007</xref>; <xref ref-type="bibr" rid="B119">Yu et al., 2018</xref>). Plastid-encoded RNA polymerases in plants typically interact with nucleus-encoded sigma factors, which may direct them to specific target genes, in response to different regulatory and physiological signals (<xref ref-type="bibr" rid="B101">Shimizu et al., 2010</xref>; <xref ref-type="bibr" rid="B83">Noordally et al., 2013</xref>). Eight genes are annotated in the <italic>P. tricornutum</italic> nuclear genome to encode sigma factor related proteins (<xref ref-type="bibr" rid="B93">Rayko et al., 2010</xref>; <xref ref-type="supplementary-material" rid="TS4">Supplementary Table 4</xref>), but the functions of each protein with regard to the expression of the chloroplast genome remain unclear.</p>
<p>We investigated the functions of <italic>P. tricornutum</italic> sigma factors by combining the repartition of each sigma factor in PhaeoNet with predicted <italic>in silico</italic> localizations of <italic>P. tricornutum</italic> proteins and their closest homologs from other diatom species, as resolved with a single-gene (RAxML) tree (<xref ref-type="fig" rid="F5">Figure 5</xref>). Three of the sigma factor genes in <italic>P. tricornutum</italic> possess chloroplast-targeting sequences, as inferred by <italic>in silico</italic> prediction with HECTAR and ASAFind (<xref ref-type="bibr" rid="B47">Gschloessl et al., 2008</xref>; <xref ref-type="bibr" rid="B46">Gruber et al., 2015</xref>). One of these proteins (Phatr3_J14599, SIGMA1a) falls within the paleturquoise merged module, which is otherwise enriched in chloroplast-related functions pertaining to carbon concentration and the glycine shunt (<xref ref-type="fig" rid="F3">Figures 3&#x2013;5</xref>); while the two remaining chloroplast-targeted proteins (Phatr3_J3388, SIGMA1b; Phatr3_J17029, SIGMA3) fall within the steelblue module, which otherwise lacks obvious enrichments in chloroplast-targeted functions and instead seems to be most closely connected to nucleotide metabolism (<xref ref-type="fig" rid="F3">Figures 3</xref>, <xref ref-type="fig" rid="F5">5</xref>). Phylogenetic analysis of these three sigma factors indicate that many of their closest relatives are sequences with chloroplast-targeting signals from other diatoms, and indeed SIGMA1a and SIGMA1b appear to be recently derived paralogs of one another (<xref ref-type="fig" rid="F5">Figure 5</xref>), indicating that they are likely to be conserved parts of the diatom chloroplast transcriptional machinery. The repartition of SIGMA1b and SIGMA3 within a transcriptional module that is largely related to non-chloroplast processes may allow hierarchical control of chloroplast transcription in response to non-chloroplast signals in <italic>P. tricornutum</italic> (e.g., coordination with circadian or cell cycles, <xref ref-type="bibr" rid="B83">Noordally et al., 2013</xref>; <xref ref-type="bibr" rid="B108">Tanaka et al., 2015</xref>).</p>
<fig id="F5" position="float">
<label>FIGURE 5</label>
<caption><p>Phylogenetic and transcriptional dynamics of <italic>P. tricornutum</italic> sigma factors. This Figure shows an unrooted best-scoring tree topology for an 86 taxa x 453 aa alignment of subsampled diatom and non-diatom sigma factors and realized using MrBayes v 3.2.7a with the Jones substitution matrix, 600,000 generations, two start chains and 0.5 burnin thresholds (<xref ref-type="bibr" rid="B52">Huelsenbeck and Ronquist, 2001</xref>); and RAxML v 8.2 with the PROTGAMMAJTT substitution model with 300 bootstrap replicates (<xref ref-type="bibr" rid="B105">Stamatakis, 2014</xref>). Chloroplast-targeting predictions were performed using ASAFind with SignalP v 3.0 (<xref ref-type="bibr" rid="B46">Gruber et al., 2015</xref>); and HECTAR (<xref ref-type="bibr" rid="B47">Gschloessl et al., 2008</xref>) under default conditions. Branches are colored by phylogenetic affiliation and bootstrap values of nodes recovered with &#x003E; 40% support are shown. Eight <italic>P. tricornutum</italic> sigma factors are labeled with PhaeoNet merged module repartition and chloroplast targeting sequences were predicted by HECTAR or ASAFind (<xref ref-type="bibr" rid="B46">Gruber et al., 2015</xref>).</p></caption>
<graphic xlink:href="fpls-11-590949-g005.tif"/>
</fig>
<p>The remaining five <italic>P. tricornutum</italic> sigma factors were not predicted to be targeted to the chloroplast and phylogenetic analysis indicated that their closest diatom relatives primarily also lacked chloroplast-targeting signals (<xref ref-type="fig" rid="F5">Figure 5</xref>). One of these non-chloroplast-associated sigma factors (Phatr3_J5537, SIGMA2) fell within the largely chloroplast-independent brown module, suggesting that it has non-chloroplastic functions. In contrast, the remaining non-chloroplast targeted sigma factors fell within modules otherwise enriched in chloroplast-associated functions; either lightsteelblue (Phatr3_J9312, SIGMA4), or paleturquoise (Phatr3_J14908, Phatr3_J9855, Phatr3_J50183; SIGMA 5-7; <xref ref-type="fig" rid="F3">Figures 3</xref>, <xref ref-type="fig" rid="F5">5</xref>). It remains to be determined whether these sigma factors are targeted to the <italic>P. tricornutum</italic> chloroplast, but using alternative methods to those recognized by HECTAR or ASAFind, as per certain other diatom proteins (<xref ref-type="bibr" rid="B58">Kazamia et al., 2018</xref>; <xref ref-type="bibr" rid="B98">Schober et al., 2019</xref>); function in compartments other than the chloroplast, but participate indirectly in the regulation, e.g., of nucleus-encoded proteins implicated in chloroplast metabolism; or have functions independent of the chloroplast, as has been documented for some other eukaryotic sigma factors (<xref ref-type="bibr" rid="B99">Shadel and Clayton, 1995</xref>; <xref ref-type="bibr" rid="B12">Beardslee et al., 2002</xref>). These different possibilities may be best discriminated by the experimental characterization, e.g., through mutagenesis and functional phenotyping, of individual <italic>P. tricornutum</italic> sigma factor genes.</p>
</sec>
</sec>
<sec id="S4">
<title>Concluding Remarks</title>
<p>In this project, we have used WGCNA to build an integrated network of <italic>P. tricornutum</italic> gene co-regulation, which we name &#x201C;PhaeoNet.&#x201D; Our model is able to retrieve well established biological pathways (e.g., chloroplast photosynthetic, anabolic metabolism; and mitochondrial respiration, <xref ref-type="fig" rid="F4">Figure 4</xref>) and compares favorably to existing (e.g., microarray-based; <xref ref-type="bibr" rid="B7">Ashworth et al., 2016</xref>) studies of gene co-regulation for this species (<xref ref-type="bibr" rid="B7">Ashworth et al., 2016</xref>; <xref ref-type="fig" rid="F1">Figures 1</xref>, <xref ref-type="fig" rid="F2">2</xref> and <xref ref-type="supplementary-material" rid="FS1">Supplementary Figures 1&#x2013;4</xref>). Moreover, our dataset carries the advantage of decomposing the <italic>P. tricornutum</italic> genome into a smaller number (28) of functionally distinct modules than produced by DiatomPortal. We have integrated these data into previously generated functional, targeting and evolutionary analyses of the <italic>P. tricornutum</italic> genome, allowing us to gain holistic insights into the processes underpinning the gene co-regulation of specific biological processes and organelle metabolic pathways pertinent to diatom biology (<xref ref-type="fig" rid="F3">Figure 3</xref> and <xref ref-type="supplementary-material" rid="FS5">Supplementary Figure 5</xref>).</p>
<p>Through a deeper inspection of genes encoding chloroplast and mitochondria-targeted proteins within these data, we identify PhaeoNet merged modules underpinning anabolic (blue), photosynthetic (lightsteelblue 1, lightcyan1) and respiratory (orangered4, cyan) metabolism, and identify multiple metabolic connections between the chloroplast and mitochondria. These include the glycine shunt within the paleturquoise merged module; the ornithine-urea cycle within the magenta merged module; and coordinated chloroplast and mitochondrial alternative oxidase activities in the skyblue merged module; <xref ref-type="fig" rid="F4">Figure 4</xref> and <xref ref-type="supplementary-material" rid="FS6">Supplementary Figure 6</xref>. Finally, considering the repartition of transcription-related proteins within our data, we identify probable cognate regulators for different co-ordinated metabolic pathways (<xref ref-type="fig" rid="F5">Figure 5</xref> and <xref ref-type="supplementary-material" rid="FS7">Supplementary Figure 7</xref>), demonstrating different associations of aureochrome transcription factors with different chloroplast metabolic pathways. We notably identify hidden diversity in the range of sigma factor genes in the <italic>P. tricornutum</italic> genome, some of which are likely to be involved in the transcriptional regulation of different chloroplast-encoded genes in response to different physiological signals, while others are likely to have different functions to chloroplast gene expression.</p>
<p>The PhaeoNet dataset may be usable as a predictive tool for the characterization of poorly understood proteins, either directly in <italic>P. tricornutum</italic>, as a well-studied model diatom species, or in other diatom or microalgal species for which homologs of <italic>P. tricornutum</italic> proteins are known either from genome or transcriptome datasets (e.g., <xref ref-type="bibr" rid="B60">Keeling et al., 2014</xref>; <xref ref-type="bibr" rid="B25">Carradec et al., 2018</xref>; <xref ref-type="bibr" rid="B97">Sato et al., 2020</xref>). We stress that biological processes elucidated in this species may not necessarily be directly extrapolatable to other algal species; and examples are already known of proteins (e.g., proteins involved in iron-stress tolerance and C4 photosynthesis) that may have different physiological functions even between different diatoms (<xref ref-type="bibr" rid="B65">Kustka et al., 2014</xref>; <xref ref-type="bibr" rid="B66">Lampe et al., 2018</xref>). Cross-comparisons between PhaeoNet and other data, e.g., gene coregulation datasets erected in other, less well-studied species (<xref ref-type="bibr" rid="B7">Ashworth et al., 2016</xref>; <xref ref-type="bibr" rid="B6">Ashworth and Ralph, 2018</xref>); environmental expression trends (<xref ref-type="bibr" rid="B25">Carradec et al., 2018</xref>); and the phenotypes of a wider range of mutant lines generated in <italic>P. tricornutum</italic> will be essential to understanding the diversity of functions performed by understudied proteins in diatoms and other algae. Nonetheless, insights from our data, delivering actors and signatures of metabolic co-regulation in diatoms, will provide a useful community resource for subsequent directed experimental investigation.</p>
</sec>
<sec id="S5">
<title>Data Availability Statement</title>
<p>Publicly available datasets were analyzed in this study. This data can be found here: <ext-link ext-link-type="uri" xlink:href="https://osf.io/42xmp/">https://osf.io/42xmp/</ext-link>.</p>
</sec>
<sec id="S6">
<title>Author Contributions</title>
<p>OA-M was responsible for the design and construction of PhaeoNet. AMGNV and NJ performed the functional analysis of the PhaeoNet modules. YL and XZ participated in the construction of the data used for functional analysis. AG, LT, and CB were responsible for the supervision of the construction of PhaeoNet. RGD was responsible for the supervision of functional analysis. OA-M and RGD wrote the manuscript, with input from all other co-authors. All authors contributed to the article and approved the submitted version.</p>
</sec>
<sec id="conf1">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
</body>
<back>
<fn-group>
<fn fn-type="financial-disclosure">
<p><bold>Funding.</bold> RGD and AMGNV acknowledge funding from a CNRS Momentum Fellowship (awarded to RGD, 2019-2021). CB acknowledges funding from the European Research Council for an Advanced Award (grant ERC 835067-DIATOMIC), grants from the French Agence Nationale de la Recherche (MEMOLIFE, ref. ANR10-LABX-54, OCEANOMICS, ref. ANR-11-BTBR-0008 and BrownCut, ref. ANR-19-CE20-0020) and Research Grant &#x201C;Green Life in the Dark&#x201D; (RGP0003/2016) from the Human Frontier Science Program. LT acknowledges funding from the CNRS, the region of Pays de la Loire (ConnecTalent EPIALG project) and Nantes m&#x00E9;tropoles. XZ acknowledges a Ph.D. fellowship from the Chinese Scholarship Council (CSC-201604910722) and funding from R&#x00E9;gion Pays de la Loire (Awarded to LT).</p>
</fn>
</fn-group>
<ack>
<p>We would like to thank Dr. Justin Ashworth (University of Technology Sydney) and Dr. Serdar Turkarslan (Institute for Systems Biology, Seattle) for the kind provision of analogous cluster composition data from the DiatomPortal project and Prof. Angela Falciatore (Institut de Biologie Physico-Chimique, Paris) for assistance with the annotation of <italic>P. tricornutum</italic> transcription factors.</p>
</ack>
<sec id="S9" sec-type="supplementary material"><title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.frontiersin.org/articles/10.3389/fpls.2020.590949/full#supplementary-material">https://www.frontiersin.org/articles/10.3389/fpls.2020.590949/full#supplementary-material</ext-link></p>
<supplementary-material xlink:href="Table_1.XLSX" id="TS1" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table_2.XLSX" id="TS2" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table_3.XLSX" id="TS3" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table_4.XLSX" id="TS4" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Table_5.XLSX" id="TS5" mimetype="application/vnd.openxmlformats-officedocument.spreadsheetml.sheet" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image_1.TIFF" id="FS1" mimetype="image/tiff" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image_2.TIFF" id="FS2" mimetype="image/tiff" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image_3.TIFF" id="FS3" mimetype="image/tiff" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image_4.TIFF" id="FS4" mimetype="image/tiff" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image_5.TIFF" id="FS5" mimetype="image/tiff" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image_6.JPEG" id="FS6" mimetype="image/jpeg" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="Image_7.JPEG" id="FS7" mimetype="image/jpeg" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<ref-list>
<title>References</title>
<ref id="B1"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Aibar</surname> <given-names>S.</given-names></name> <name><surname>Fontanillo</surname> <given-names>C.</given-names></name> <name><surname>Droste</surname> <given-names>C.</given-names></name> <name><surname>De Las Rivas</surname> <given-names>J.</given-names></name></person-group> (<year>2015</year>). <article-title>Functional gene networks: R/Bioc package to generate and analyse gene networks derived from functional enrichment and clustering.</article-title> <source><italic>Bioinformatics</italic></source> <volume>31</volume> <fpage>1686</fpage>&#x2013;<lpage>1688</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btu864</pub-id> <pub-id pub-id-type="pmid">25600944</pub-id></citation></ref>
<ref id="B2"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Allen</surname> <given-names>A. E.</given-names></name> <name><surname>Laroche</surname> <given-names>J.</given-names></name> <name><surname>Maheswari</surname> <given-names>U.</given-names></name> <name><surname>Lommer</surname> <given-names>M.</given-names></name> <name><surname>Schauer</surname> <given-names>N.</given-names></name> <name><surname>Lopez</surname> <given-names>P. J.</given-names></name><etal/></person-group> (<year>2008</year>). <article-title>Whole-cell response of the pennate diatom <italic>Phaeodactylum tricornutum</italic> to iron starvation.</article-title> <source><italic>Proc. Natl. Acad. Sci. U.S.A.</italic></source> <volume>105</volume> <fpage>10438</fpage>&#x2013;<lpage>10443</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.0711370105</pub-id> <pub-id pub-id-type="pmid">18653757</pub-id></citation></ref>
<ref id="B3"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Allen</surname> <given-names>J. F.</given-names></name></person-group> (<year>2003</year>). <article-title>The function of genomes in bioenergetic organelles.</article-title> <source><italic>Phil. Trans. R. Soc. Biol.</italic></source> <volume>358</volume> <fpage>19</fpage>&#x2013;<lpage>37</lpage>. <pub-id pub-id-type="doi">10.1098/rstb.2002.1191</pub-id> <pub-id pub-id-type="pmid">12594916</pub-id></citation></ref>
<ref id="B4"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Annunziata</surname> <given-names>R.</given-names></name> <name><surname>Ritter</surname> <given-names>A.</given-names></name> <name><surname>Fortunato</surname> <given-names>A. E.</given-names></name> <name><surname>Manzotti</surname> <given-names>A.</given-names></name> <name><surname>Cheminant-Navarro</surname> <given-names>S.</given-names></name> <name><surname>Agier</surname> <given-names>N.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>bHLH-PAS protein RITMO1 regulates diel biological rhythms in the marine diatom P. <italic>tricornutum</italic>.</article-title> <source><italic>Proc. Natl. Acad. Sci. U.S.A.</italic></source> <volume>116</volume> <fpage>13137</fpage>&#x2013;<lpage>13142</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1819660116</pub-id> <pub-id pub-id-type="pmid">31171659</pub-id></citation></ref>
<ref id="B5"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Aramaki</surname> <given-names>T.</given-names></name> <name><surname>Blanc-Mathieu</surname> <given-names>R.</given-names></name> <name><surname>Endo</surname> <given-names>H.</given-names></name> <name><surname>Ohkubo</surname> <given-names>K.</given-names></name> <name><surname>Kanehisa</surname> <given-names>M.</given-names></name> <name><surname>Goto</surname> <given-names>S.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>KofamKOALA: KEGG ortholog assignment based on profile HMM and adaptive score threshold.</article-title> <source><italic>Bioinformatics.</italic></source> <volume>36</volume> <fpage>2251</fpage>&#x2013;<lpage>2252</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btz859</pub-id> <pub-id pub-id-type="pmid">31742321</pub-id></citation></ref>
<ref id="B6"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ashworth</surname> <given-names>J.</given-names></name> <name><surname>Ralph</surname> <given-names>P. J.</given-names></name></person-group> (<year>2018</year>). <article-title>An explorable public transcriptomics compendium for eukaryotic microalgae.</article-title> <source><italic>bioRxiv[Preprint].</italic></source> <pub-id pub-id-type="doi">10.1101/403063</pub-id></citation></ref>
<ref id="B7"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Ashworth</surname> <given-names>J.</given-names></name> <name><surname>Turkarslan</surname> <given-names>S.</given-names></name> <name><surname>Harris</surname> <given-names>M.</given-names></name> <name><surname>Orellana</surname> <given-names>M. V.</given-names></name> <name><surname>Baliga</surname> <given-names>N. S.</given-names></name></person-group> (<year>2016</year>). <article-title>Pan-transcriptomic analysis identifies coordinated and orthologous functional modules in the diatoms <italic>Thalassiosira pseudonana</italic> and <italic>Phaeodactylum tricornutum</italic>.</article-title> <source><italic>Mar. Genom.</italic></source> <volume>26</volume> <fpage>21</fpage>&#x2013;<lpage>28</lpage>. <pub-id pub-id-type="doi">10.1016/j.margen.2015.10.011</pub-id> <pub-id pub-id-type="pmid">26560047</pub-id></citation></ref>
<ref id="B8"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bailleul</surname> <given-names>B.</given-names></name> <name><surname>Berne</surname> <given-names>N.</given-names></name> <name><surname>Murik</surname> <given-names>O.</given-names></name> <name><surname>Petroutsos</surname> <given-names>D.</given-names></name> <name><surname>Prihoda</surname> <given-names>J.</given-names></name> <name><surname>Tanaka</surname> <given-names>A.</given-names></name></person-group> (<year>2015</year>). <article-title>Energetic coupling between plastids and mitochondria drives CO2 assimilation in diatoms.</article-title> <source><italic>Nature</italic></source> <volume>524</volume> <fpage>366</fpage>&#x2013;<lpage>371</lpage>. <pub-id pub-id-type="doi">10.1038/nature14599</pub-id> <pub-id pub-id-type="pmid">26168400</pub-id></citation></ref>
<ref id="B9"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Banerjee</surname> <given-names>A.</given-names></name> <name><surname>Herman</surname> <given-names>E.</given-names></name> <name><surname>Serif</surname> <given-names>M.</given-names></name> <name><surname>Maestre-Reyna</surname> <given-names>M.</given-names></name> <name><surname>Hepp</surname> <given-names>S.</given-names></name> <name><surname>Pokorny</surname> <given-names>R.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>Allosteric communication between DNA-binding and light-responsive domains of diatom class I aureochromes.</article-title> <source><italic>Nucl. Acids Res.</italic></source> <volume>44</volume> <fpage>5957</fpage>&#x2013;<lpage>5970</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkw420</pub-id> <pub-id pub-id-type="pmid">27179025</pub-id></citation></ref>
<ref id="B10"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Barab&#x00E1;si</surname> <given-names>A. L.</given-names></name></person-group> (<year>2009</year>). <article-title>Scale-free networks: a decade and beyond.</article-title> <source><italic>Science</italic></source> <volume>325</volume> <fpage>412</fpage>&#x2013;<lpage>413</lpage>. <pub-id pub-id-type="doi">10.1126/science.1173299</pub-id> <pub-id pub-id-type="pmid">19628854</pub-id></citation></ref>
<ref id="B11"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>B&#x00E1;rtov&#x00E1;</surname> <given-names>E.</given-names></name> <name><surname>Krej&#x010D;&#x00ED;</surname> <given-names>J.</given-names></name> <name><surname>Harni&#x011B;arov&#x00E1;</surname> <given-names>A.</given-names></name> <name><surname>Galiov&#x00E1;</surname> <given-names>G.</given-names></name> <name><surname>Kozubek</surname> <given-names>S.</given-names></name></person-group> (<year>2008</year>). <article-title>Histone modifications and nuclear architecture: a review.</article-title> <source><italic>J. Histochem. Cytochem</italic></source> <volume>56</volume> <fpage>711</fpage>&#x2013;<lpage>721</lpage>. <pub-id pub-id-type="doi">10.1369/jhc.2008.951251</pub-id> <pub-id pub-id-type="pmid">18474937</pub-id></citation></ref>
<ref id="B12"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Beardslee</surname> <given-names>T. A.</given-names></name> <name><surname>Roy-Chowdhury</surname> <given-names>S.</given-names></name> <name><surname>Jaiswal</surname> <given-names>P.</given-names></name> <name><surname>Buhot</surname> <given-names>L.</given-names></name> <name><surname>Lerbs-Mache</surname> <given-names>S.</given-names></name> <name><surname>Stern</surname> <given-names>D. B.</given-names></name><etal/></person-group> (<year>2002</year>). <article-title>A nucleus-encoded maize protein with sigma factor activity accumulates in mitochondria and chloroplasts.</article-title> <source><italic>Plant. J.</italic></source> <volume>31</volume> <fpage>199</fpage>&#x2013;<lpage>209</lpage>. <pub-id pub-id-type="doi">10.1046/j.1365-313x.2002.01344.x</pub-id> <pub-id pub-id-type="pmid">12121449</pub-id></citation></ref>
<ref id="B13"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bendtsen</surname> <given-names>J. D.</given-names></name> <name><surname>Nielsen</surname> <given-names>H.</given-names></name> <name><surname>von Heijne</surname> <given-names>G.</given-names></name> <name><surname>Brunak</surname> <given-names>S.</given-names></name></person-group> (<year>2004</year>). <article-title>Improved prediction of signal peptides: SignalP 3.0.</article-title> <source><italic>J. Mol. Biol</italic></source> <volume>340</volume> <fpage>783</fpage>&#x2013;<lpage>795</lpage>. <pub-id pub-id-type="doi">10.1016/j.jmb.2004.05.028</pub-id> <pub-id pub-id-type="pmid">15223320</pub-id></citation></ref>
<ref id="B14"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bentley</surname> <given-names>D. R.</given-names></name> <name><surname>Balasubramanian</surname> <given-names>S.</given-names></name> <name><surname>Swerdlow</surname> <given-names>H. P.</given-names></name> <name><surname>Smith</surname> <given-names>G. P.</given-names></name> <name><surname>Milton</surname> <given-names>J.</given-names></name> <name><surname>Brown</surname> <given-names>C. G.</given-names></name><etal/></person-group> (<year>2008</year>). <article-title>Accurate whole human genome sequencing using reversible terminator chemistry.</article-title> <source><italic>Nature</italic></source> <volume>456</volume> <fpage>53</fpage>&#x2013;<lpage>59</lpage>. <pub-id pub-id-type="doi">10.1038/nature07517</pub-id> <pub-id pub-id-type="pmid">18987734</pub-id></citation></ref>
<ref id="B15"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bertrand</surname> <given-names>M.</given-names></name></person-group> (<year>2010</year>). <article-title>Carotenoid biosynthesis in diatoms.</article-title> <source><italic>Photosynthesis Res.</italic></source> <volume>106</volume> <fpage>89</fpage>&#x2013;<lpage>102</lpage>. <pub-id pub-id-type="doi">10.1007/s11120-010-9589-x</pub-id> <pub-id pub-id-type="pmid">20734232</pub-id></citation></ref>
<ref id="B16"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bird</surname> <given-names>A.</given-names></name></person-group> (<year>2002</year>). <article-title>DNA methylation patterns and epigenetic memory.</article-title> <source><italic>Genes Dev.</italic></source> <volume>16</volume> <fpage>6</fpage>&#x2013;<lpage>21</lpage>. <pub-id pub-id-type="doi">10.1101/gad.947102</pub-id> <pub-id pub-id-type="pmid">11782440</pub-id></citation></ref>
<ref id="B17"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bohne</surname> <given-names>A.-V.</given-names></name> <name><surname>Schwenkert</surname> <given-names>S.</given-names></name> <name><surname>Grimm</surname> <given-names>B.</given-names></name> <name><surname>Nickelsen</surname> <given-names>J.</given-names></name></person-group> (<year>2016</year>). <article-title>Roles of tetratricopeptide repeat proteins in biogenesis of the photosynthetic apparatus.</article-title> <source><italic>Int. Rev. Cell Mol. Biol.</italic></source> <volume>324</volume> <fpage>187</fpage>&#x2013;<lpage>227</lpage>. <pub-id pub-id-type="doi">10.1016/bs.ircmb.2016.01.005</pub-id> <pub-id pub-id-type="pmid">27017009</pub-id></citation></ref>
<ref id="B18"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bowler</surname> <given-names>C.</given-names></name> <name><surname>Allen</surname> <given-names>A. E.</given-names></name> <name><surname>Badger</surname> <given-names>J. H.</given-names></name> <name><surname>Grimwood</surname> <given-names>J.</given-names></name> <name><surname>Jabbari</surname> <given-names>K.</given-names></name> <name><surname>Kuo</surname> <given-names>A.</given-names></name><etal/></person-group> (<year>2008</year>). <article-title>The P. <italic>tricornutum</italic> genome reveals the evolutionary history of diatom genomes.</article-title> <source><italic>Nature</italic></source> <volume>456</volume> <fpage>239</fpage>&#x2013;<lpage>244</lpage>. <pub-id pub-id-type="doi">10.1038/nature07410</pub-id> <pub-id pub-id-type="pmid">18923393</pub-id></citation></ref>
<ref id="B19"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bowler</surname> <given-names>C.</given-names></name> <name><surname>Vardi</surname> <given-names>A.</given-names></name> <name><surname>Allen</surname> <given-names>A. E.</given-names></name></person-group> (<year>2010</year>). <article-title>Oceanographic and biogeochemical insights from diatom genomes.</article-title> <source><italic>Ann. Rev. Mar. Sci.</italic></source> <volume>2</volume> <fpage>333</fpage>&#x2013;<lpage>365</lpage>. <pub-id pub-id-type="doi">10.1146/annurev-marine-120308-081051</pub-id> <pub-id pub-id-type="pmid">21141668</pub-id></citation></ref>
<ref id="B20"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Broddrick</surname> <given-names>J. T.</given-names></name> <name><surname>Du</surname> <given-names>N.</given-names></name> <name><surname>Smith</surname> <given-names>S. R.</given-names></name> <name><surname>Tsuji</surname> <given-names>Y.</given-names></name> <name><surname>Jallet</surname> <given-names>D.</given-names></name> <name><surname>Ware</surname> <given-names>M. A.</given-names></name></person-group> (<year>2019</year>). <article-title>Cross-compartment metabolic coupling enables flexible photoprotective mechanisms in the diatom <italic>Phaeodactylum tricornutum</italic>.</article-title> <source><italic>New Phytol.</italic></source> <volume>222</volume> <fpage>1364</fpage>&#x2013;<lpage>1379</lpage>. <pub-id pub-id-type="doi">10.1111/nph.15685</pub-id> <pub-id pub-id-type="pmid">30636322</pub-id></citation></ref>
<ref id="B21"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Bromke</surname> <given-names>M. A.</given-names></name></person-group> (<year>2013</year>). <article-title>Amino Acid biosynthesis pathways in diatoms.</article-title> <source><italic>Metabolites</italic></source> <volume>3</volume> <fpage>294</fpage>&#x2013;<lpage>311</lpage>. <pub-id pub-id-type="doi">10.3390/metabo3020294</pub-id> <pub-id pub-id-type="pmid">24957993</pub-id></citation></ref>
<ref id="B22"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>B&#x00FC;chel</surname> <given-names>C.</given-names></name></person-group> (<year>2015</year>). <article-title>Evolution and function of light harvesting proteins.</article-title> <source><italic>J. Plant. Physiol.</italic></source> <volume>172</volume> <fpage>62</fpage>&#x2013;<lpage>75</lpage>. <pub-id pub-id-type="doi">10.1016/j.jplph.2014.04.018</pub-id> <pub-id pub-id-type="pmid">25240794</pub-id></citation></ref>
<ref id="B23"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Buck</surname> <given-names>J. M.</given-names></name> <name><surname>Sherman</surname> <given-names>J.</given-names></name> <name><surname>R&#x00ED;o B&#x00E1;rtulos</surname> <given-names>C.</given-names></name> <name><surname>Serif</surname> <given-names>M.</given-names></name> <name><surname>Halder</surname> <given-names>M.</given-names></name> <name><surname>Henkel</surname> <given-names>J.</given-names></name></person-group> (<year>2019</year>). <article-title>Lhcx proteins provide photoprotection via thermal dissipation of absorbed light in the diatom <italic>Phaeodactylum tricornutum</italic>.</article-title> <source><italic>Nat. Commun.</italic></source> <volume>10</volume>:<issue>4167</issue>. <pub-id pub-id-type="doi">10.1038/s41467-019-12043-6</pub-id> <pub-id pub-id-type="pmid">31519883</pub-id></citation></ref>
<ref id="B24"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Capella-Guti&#x00E9;rrez</surname> <given-names>S.</given-names></name> <name><surname>Silla-Mart&#x00ED;nez</surname> <given-names>J. M.</given-names></name> <name><surname>Gabald&#x00F3;n</surname> <given-names>T.</given-names></name></person-group> (<year>2009</year>). <article-title>trimAl: a tool for automated alignment trimming in large-scale phylogenetic analyses.</article-title> <source><italic>Bioinformatics</italic></source> <volume>25</volume> <fpage>1972</fpage>&#x2013;<lpage>1973</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btp348</pub-id> <pub-id pub-id-type="pmid">19505945</pub-id></citation></ref>
<ref id="B25"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Carradec</surname> <given-names>Q.</given-names></name> <name><surname>Pelletier</surname> <given-names>E.</given-names></name> <name><surname>Da Silva</surname> <given-names>C.</given-names></name> <name><surname>Alberti</surname> <given-names>A.</given-names></name> <name><surname>Seeleuthner</surname> <given-names>Y.</given-names></name> <name><surname>Blanc-Mathieu</surname> <given-names>R.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>A global ocean atlas of eukaryotic genes.</article-title> <source><italic>Nat. Commun.</italic></source> <volume>9</volume>:<issue>373</issue>. <pub-id pub-id-type="doi">10.1038/s41467-017-02342-1</pub-id> <pub-id pub-id-type="pmid">29371626</pub-id></citation></ref>
<ref id="B26"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chappell</surname> <given-names>P. D.</given-names></name> <name><surname>Whitney</surname> <given-names>L. P.</given-names></name> <name><surname>Wallace</surname> <given-names>J. R.</given-names></name> <name><surname>Darer</surname> <given-names>A. I.</given-names></name> <name><surname>Jean-Charles</surname> <given-names>S.</given-names></name> <name><surname>Jenkins</surname> <given-names>B. D.</given-names></name></person-group> (<year>2015</year>). <article-title>Genetic indicators of iron limitation in wild populations of Thalassiosira oceanica from the northeast Pacific Ocean.</article-title> <source><italic>ISME J.</italic></source> <volume>9</volume> <fpage>592</fpage>&#x2013;<lpage>602</lpage>. <pub-id pub-id-type="doi">10.1038/ismej.2014.171</pub-id> <pub-id pub-id-type="pmid">25333460</pub-id></citation></ref>
<ref id="B27"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chen</surname> <given-names>Z.</given-names></name> <name><surname>Yang</surname> <given-names>M. K.</given-names></name> <name><surname>Li</surname> <given-names>C. Y.</given-names></name> <name><surname>Wang</surname> <given-names>Y.</given-names></name> <name><surname>Zhang</surname> <given-names>J.</given-names></name> <name><surname>Wang</surname> <given-names>D. B.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>Phosphoproteomic analysis provides novel insights into stress responses in <italic>Phaeodactylum tricornutum</italic>, a model diatom.</article-title> <source><italic>J Proteom. Res.</italic></source> <volume>13</volume> <fpage>2511</fpage>&#x2013;<lpage>2523</lpage>. <pub-id pub-id-type="doi">10.1021/pr401290u</pub-id> <pub-id pub-id-type="pmid">24712722</pub-id></citation></ref>
<ref id="B28"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Chi</surname> <given-names>W.</given-names></name> <name><surname>Ma</surname> <given-names>J.</given-names></name> <name><surname>Zhang</surname> <given-names>L.</given-names></name></person-group> (<year>2012</year>). <article-title>Regulatory factors for the assembly of thylakoid membrane protein complexes.</article-title> <source><italic>Phil. Trans. R. Soc. B</italic></source> <volume>367</volume> <fpage>3420</fpage>&#x2013;<lpage>3429</lpage>. <pub-id pub-id-type="doi">10.1098/rstb.2012.0065</pub-id> <pub-id pub-id-type="pmid">23148269</pub-id></citation></ref>
<ref id="B29"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cihlar</surname> <given-names>J.</given-names></name> <name><surname>Fussy</surname> <given-names>Z.</given-names></name> <name><surname>Horak</surname> <given-names>A.</given-names></name> <name><surname>Obornik</surname> <given-names>M.</given-names></name></person-group> (<year>2016</year>). <article-title>Evolution of the tetrapyrrole biosynthetic pathway in secondary algae: conservation, redundancy and replacement.</article-title> <source><italic>PLoS One</italic></source> <volume>11</volume>:<issue>0166338</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0166338</pub-id> <pub-id pub-id-type="pmid">27861576</pub-id></citation></ref>
<ref id="B30"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Cruz de Carvalho</surname> <given-names>M. H.</given-names></name> <name><surname>Sun</surname> <given-names>H. X.</given-names></name> <name><surname>Bowler</surname> <given-names>C.</given-names></name> <name><surname>Chua</surname> <given-names>N. H.</given-names></name></person-group> (<year>2016</year>). <article-title>Noncoding and coding transcriptome responses of a marine diatom to phosphate fluctuations.</article-title> <source><italic>New Phytol.</italic></source> <volume>210</volume> <fpage>497</fpage>&#x2013;<lpage>510</lpage>. <pub-id pub-id-type="doi">10.1111/nph.13787</pub-id> <pub-id pub-id-type="pmid">26680538</pub-id></citation></ref>
<ref id="B31"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dautermann</surname> <given-names>O.</given-names></name> <name><surname>Lohr</surname> <given-names>M.</given-names></name></person-group> (<year>2017</year>). <article-title>A functional zeaxanthin epoxidase from red algae shedding light on the evolution of light-harvesting carotenoids and the xanthophyll cycle in photosynthetic eukaryotes.</article-title> <source><italic>Plant J.</italic></source> <volume>92</volume> <fpage>879</fpage>&#x2013;<lpage>891</lpage>. <pub-id pub-id-type="doi">10.1111/tpj.13725</pub-id> <pub-id pub-id-type="pmid">28949044</pub-id></citation></ref>
<ref id="B32"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Davis</surname> <given-names>A.</given-names></name> <name><surname>Abbriano</surname> <given-names>R.</given-names></name> <name><surname>Smith</surname> <given-names>S. R.</given-names></name> <name><surname>Hildebrand</surname> <given-names>M.</given-names></name></person-group> (<year>2017</year>). <article-title>Clarification of photorespiratory processes and the role of Malic Enzyme in diatoms.</article-title> <source><italic>Protist</italic></source> <volume>168</volume> <fpage>134</fpage>&#x2013;<lpage>153</lpage>. <pub-id pub-id-type="doi">10.1016/j.protis.2016.10.005</pub-id> <pub-id pub-id-type="pmid">28104538</pub-id></citation></ref>
<ref id="B33"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>D&#x0142;u&#x017C;ewska</surname> <given-names>J.</given-names></name> <name><surname>Szyman&#x00EC;ska</surname> <given-names>R.</given-names></name> <name><surname>Gabruk</surname> <given-names>M.</given-names></name> <name><surname>Ko&#x00EC;s</surname> <given-names>P. B.</given-names></name> <name><surname>Nowicka</surname> <given-names>B.</given-names></name> <name><surname>Kruk</surname> <given-names>J.</given-names></name></person-group> (<year>2016</year>). <article-title>Tocopherol cyclases- substrate specificity and phylogenetic relations.</article-title> <source><italic>PLoS One</italic></source> <volume>11</volume>:<issue>0159629</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0159629</pub-id> <pub-id pub-id-type="pmid">27462710</pub-id></citation></ref>
<ref id="B34"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dobin</surname> <given-names>A.</given-names></name> <name><surname>Davis</surname> <given-names>C. A.</given-names></name> <name><surname>Schlesinger</surname> <given-names>F.</given-names></name> <name><surname>Drenkow</surname> <given-names>J.</given-names></name> <name><surname>Zaleski</surname> <given-names>C.</given-names></name> <name><surname>Jha</surname> <given-names>S.</given-names></name><etal/></person-group> (<year>2013</year>). <article-title>STAR: ultrafast universal RNA-seq aligner.</article-title> <source><italic>Bioinformat.</italic></source> <volume>29</volume> <fpage>15</fpage>&#x2013;<lpage>21</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/bts635</pub-id> <pub-id pub-id-type="pmid">23104886</pub-id></citation></ref>
<ref id="B35"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dorrell</surname> <given-names>R. G.</given-names></name> <name><surname>Azuma</surname> <given-names>T.</given-names></name> <name><surname>Nomura</surname> <given-names>M.</given-names></name> <name><surname>Audren de Kerdrel</surname> <given-names>G.</given-names></name> <name><surname>Paoli</surname> <given-names>L.</given-names></name> <name><surname>Yang</surname> <given-names>S.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>Principles of plastid reductive evolution illuminated by nonphotosynthetic chrysophytes.</article-title> <source><italic>Proc. Natl. Acad. Sci. U.S.A.</italic></source> <volume>116</volume> <fpage>6914</fpage>&#x2013;<lpage>6923</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1819976116</pub-id> <pub-id pub-id-type="pmid">30872488</pub-id></citation></ref>
<ref id="B36"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dorrell</surname> <given-names>R. G.</given-names></name> <name><surname>Bowler</surname> <given-names>C.</given-names></name></person-group> (<year>2017</year>). <article-title>Secondary plastids of stramenopiles.</article-title> <source><italic>Adv. Bot. Res.</italic></source> <volume>84</volume> <fpage>59</fpage>&#x2013;<lpage>103</lpage>.</citation></ref>
<ref id="B37"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Dorrell</surname> <given-names>R. G.</given-names></name> <name><surname>Gile</surname> <given-names>G.</given-names></name> <name><surname>McCallum</surname> <given-names>G.</given-names></name> <name><surname>M&#x00E9;heust</surname> <given-names>R.</given-names></name> <name><surname>Bapteste</surname> <given-names>E. P.</given-names></name> <name><surname>Klinger</surname> <given-names>C. M.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>Chimeric origins of ochrophytes and haptophytes revealed through an ancient plastid proteome.</article-title> <source><italic>eLife</italic></source> <volume>6</volume> <issue>23717</issue>. <pub-id pub-id-type="doi">10.7554/eLife.23717</pub-id> <pub-id pub-id-type="pmid">28498102</pub-id></citation></ref>
<ref id="B38"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Egue</surname> <given-names>F.</given-names></name> <name><surname>Chenais</surname> <given-names>B.</given-names></name> <name><surname>Tastard</surname> <given-names>E.</given-names></name> <name><surname>Marchand</surname> <given-names>J.</given-names></name> <name><surname>Hiard</surname> <given-names>S.</given-names></name> <name><surname>Gateau</surname> <given-names>H.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>Expression of the retrotransposons Surcouf and Blackbeard in the marine diatom <italic>Phaeodactylum tricornutum</italic> under thermal stress.</article-title> <source><italic>Phycologia</italic></source> <volume>54</volume> <fpage>617</fpage>-<lpage>627</lpage>.</citation></ref>
<ref id="B39"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Field</surname> <given-names>C. B.</given-names></name> <name><surname>Behrenfeld</surname> <given-names>M. J.</given-names></name> <name><surname>Randerson</surname> <given-names>J. T.</given-names></name> <name><surname>Falkowski</surname> <given-names>P.</given-names></name></person-group> (<year>1998</year>). <article-title>Primary production of the biosphere: integrating terrestrial and oceanic components.</article-title> <source><italic>Science</italic></source> <volume>281</volume> <fpage>237</fpage>&#x2013;<lpage>240</lpage>. <pub-id pub-id-type="doi">10.1126/science.281.5374.237</pub-id> <pub-id pub-id-type="pmid">9657713</pub-id></citation></ref>
<ref id="B40"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Frommolt</surname> <given-names>R.</given-names></name> <name><surname>Werner</surname> <given-names>S.</given-names></name> <name><surname>Paulsen</surname> <given-names>H.</given-names></name> <name><surname>Goss</surname> <given-names>R.</given-names></name> <name><surname>Wilhelm</surname> <given-names>C.</given-names></name> <name><surname>Zauner</surname> <given-names>S.</given-names></name><etal/></person-group> (<year>2008</year>). <article-title>Ancient recruitment by chromists of green algal genes encoding enzymes for carotenoid biosynthesis.</article-title> <source><italic>Mol. Biol. Evol.</italic></source> <volume>25</volume> <fpage>2653</fpage>&#x2013;<lpage>2667</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msn206</pub-id> <pub-id pub-id-type="pmid">18799712</pub-id></citation></ref>
<ref id="B41"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Fukasawa</surname> <given-names>Y.</given-names></name> <name><surname>Tsuji</surname> <given-names>J.</given-names></name> <name><surname>Fu</surname> <given-names>S. C.</given-names></name> <name><surname>Tomii</surname> <given-names>K.</given-names></name> <name><surname>Horton</surname> <given-names>P.</given-names></name> <name><surname>Imai</surname> <given-names>K.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>MitoFates: improved prediction of mitochondrial targeting sequences and their cleavage sites.</article-title> <source><italic>Mol. Cell. Proteom.</italic></source> <volume>14</volume> <fpage>1113</fpage>&#x2013;<lpage>1126</lpage>. <pub-id pub-id-type="doi">10.1074/mcp.M114.043083</pub-id> <pub-id pub-id-type="pmid">25670805</pub-id></citation></ref>
<ref id="B42"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gasch</surname> <given-names>A. P.</given-names></name> <name><surname>Eisen</surname> <given-names>M. B.</given-names></name></person-group> (<year>2002</year>). <article-title>Exploring the conditional co-regulation of yeast gene expression through fuzzy k-means clustering.</article-title> <source><italic>Genom. Biol.</italic></source> <volume>3</volume>:<issue>0059</issue>. <pub-id pub-id-type="doi">10.1186/gb-2002-3-11-research0059</pub-id> <pub-id pub-id-type="pmid">12429058</pub-id></citation></ref>
<ref id="B43"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gile</surname> <given-names>G. H.</given-names></name> <name><surname>Moog</surname> <given-names>D.</given-names></name> <name><surname>Slamovits</surname> <given-names>C. H.</given-names></name> <name><surname>Maier</surname> <given-names>U. G.</given-names></name> <name><surname>Archibald</surname> <given-names>J. M.</given-names></name></person-group> (<year>2015</year>). <article-title>Dual organellar targeting of aminoacyl-tRNA synthetases in diatoms and cryptophytes.</article-title> <source><italic>Genom. Biol. Evol.</italic></source> <volume>7</volume> <fpage>1728</fpage>&#x2013;<lpage>1742</lpage>. <pub-id pub-id-type="doi">10.1093/gbe/evv095</pub-id> <pub-id pub-id-type="pmid">25994931</pub-id></citation></ref>
<ref id="B44"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Glasser</surname> <given-names>G. J.</given-names></name> <name><surname>Winter</surname> <given-names>R. F.</given-names></name></person-group> (<year>1961</year>). <article-title>Critical values of the coefficient of rank correlation for testing the hypothesis of independence.</article-title> <source><italic>Biometrika</italic></source> <volume>48</volume> <fpage>444</fpage>&#x2013;<lpage>448</lpage>. <pub-id pub-id-type="doi">10.2307/2332767</pub-id></citation></ref>
<ref id="B45"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Grouneva</surname> <given-names>I.</given-names></name> <name><surname>Rokka</surname> <given-names>A.</given-names></name> <name><surname>Aro</surname> <given-names>E. M.</given-names></name></person-group> (<year>2011</year>). <article-title>The thylakoid membrane proteome of two marine diatoms outlines both diatom-specific and species-specific features of the photosynthetic machinery.</article-title> <source><italic>J. Proteom. Res.</italic></source> <volume>10</volume> <fpage>5338</fpage>&#x2013;<lpage>5353</lpage>. <pub-id pub-id-type="doi">10.1021/pr200600f</pub-id> <pub-id pub-id-type="pmid">22017178</pub-id></citation></ref>
<ref id="B46"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gruber</surname> <given-names>A.</given-names></name> <name><surname>Rocap</surname> <given-names>G.</given-names></name> <name><surname>Kroth</surname> <given-names>P. G.</given-names></name> <name><surname>Armbrust</surname> <given-names>E. V.</given-names></name> <name><surname>Mock</surname> <given-names>T.</given-names></name></person-group> (<year>2015</year>). <article-title>Plastid proteome prediction for diatoms and other algae with secondary plastids of the red lineage.</article-title> <source><italic>Plant J.</italic></source> <volume>81</volume> <fpage>519</fpage>&#x2013;<lpage>528</lpage>. <pub-id pub-id-type="doi">10.1111/tpj.12734</pub-id> <pub-id pub-id-type="pmid">25438865</pub-id></citation></ref>
<ref id="B47"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gschloessl</surname> <given-names>B.</given-names></name> <name><surname>Guermeur</surname> <given-names>Y.</given-names></name> <name><surname>Cock</surname> <given-names>J. M.</given-names></name></person-group> (<year>2008</year>). <article-title>HECTAR: a method to predict subcellular targeting in heterokonts.</article-title> <source><italic>BMC Bioinformat.</italic></source> <volume>9</volume>:<issue>393</issue>. <pub-id pub-id-type="doi">10.1186/1471-2105-9-393</pub-id> <pub-id pub-id-type="pmid">18811941</pub-id></citation></ref>
<ref id="B48"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Guidi</surname> <given-names>L.</given-names></name> <name><surname>Chaffron</surname> <given-names>S.</given-names></name> <name><surname>Bittner</surname> <given-names>L.</given-names></name> <name><surname>Eveillard</surname> <given-names>D.</given-names></name> <name><surname>Larhlimi</surname> <given-names>A.</given-names></name> <name><surname>Roux</surname> <given-names>S.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>Plankton networks driving carbon export in the oligotrophic ocean.</article-title> <source><italic>Nature</italic></source> <volume>532</volume> <fpage>465</fpage>&#x2013;<lpage>470</lpage>. <pub-id pub-id-type="doi">10.1038/nature16942</pub-id> <pub-id pub-id-type="pmid">26863193</pub-id></citation></ref>
<ref id="B49"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Gundermann</surname> <given-names>K.</given-names></name> <name><surname>Schmidt</surname> <given-names>M.</given-names></name> <name><surname>Weisheit</surname> <given-names>W.</given-names></name> <name><surname>Mittag</surname> <given-names>M.</given-names></name> <name><surname>B&#x00FC;chel</surname> <given-names>C.</given-names></name></person-group> (<year>2013</year>). <article-title>Identification of several sub-populations in the pool of light harvesting proteins in the pennate diatom <italic>Phaeodactylum tricornutum</italic>.</article-title> <source><italic>Biochim. Biophys. Acta.</italic></source> <volume>1827</volume> <fpage>303</fpage>&#x2013;<lpage>310</lpage>. <pub-id pub-id-type="doi">10.1016/j.bbabio.2012.10.017</pub-id> <pub-id pub-id-type="pmid">23142526</pub-id></citation></ref>
<ref id="B50"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Helliwell</surname> <given-names>K. E.</given-names></name> <name><surname>Wheeler</surname> <given-names>G. L.</given-names></name> <name><surname>Leptos</surname> <given-names>K. C.</given-names></name> <name><surname>Goldstein</surname> <given-names>R. E.</given-names></name> <name><surname>Smith</surname> <given-names>A. G.</given-names></name></person-group> (<year>2011</year>). <article-title>Insights into the evolution of vitamin B12 auxotrophy from sequenced algal genomes.</article-title> <source><italic>Mol. Biol. Evol.</italic></source> <volume>28</volume> <fpage>2921</fpage>&#x2013;<lpage>2933</lpage>. <pub-id pub-id-type="doi">10.1093/molbev/msr124</pub-id> <pub-id pub-id-type="pmid">21551270</pub-id></citation></ref>
<ref id="B51"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Horton</surname> <given-names>P.</given-names></name> <name><surname>Park</surname> <given-names>K. J.</given-names></name> <name><surname>Obayashi</surname> <given-names>T.</given-names></name> <name><surname>Fujita</surname> <given-names>N.</given-names></name> <name><surname>Harada</surname> <given-names>H.</given-names></name> <name><surname>Adams-Collier</surname> <given-names>C. J.</given-names></name><etal/></person-group> (<year>2007</year>). <article-title>WoLF PSORT: protein localization predictor.</article-title> <source><italic>Nucl. Acids Res.</italic></source> <volume>35</volume> <fpage>585</fpage>&#x2013;<lpage>587</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkm259</pub-id> <pub-id pub-id-type="pmid">17517783</pub-id></citation></ref>
<ref id="B52"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Huelsenbeck</surname> <given-names>J. P.</given-names></name> <name><surname>Ronquist</surname> <given-names>F.</given-names></name></person-group> (<year>2001</year>). <article-title>MRBAYES: bayesian inference of phylogenetic trees.</article-title> <source><italic>Bioinformatics</italic></source> <volume>17</volume> <fpage>754</fpage>&#x2013;<lpage>755</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/17.8.754</pub-id> <pub-id pub-id-type="pmid">11524383</pub-id></citation></ref>
<ref id="B53"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Hunsperger</surname> <given-names>H. M.</given-names></name> <name><surname>Ford</surname> <given-names>C. J.</given-names></name> <name><surname>Miller</surname> <given-names>J. S.</given-names></name> <name><surname>Cattolico</surname> <given-names>R. A.</given-names></name></person-group> (<year>2016</year>). <article-title>Differential regulation of duplicate light-dependent protochlorophyllide oxidoreductases in the diatom <italic>Phaeodactylum tricornutum</italic>.</article-title> <source><italic>PLoS One</italic></source> <volume>11</volume>:<issue>0158614</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0158614</pub-id> <pub-id pub-id-type="pmid">27367227</pub-id></citation></ref>
<ref id="B54"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Huysman</surname> <given-names>M. J.</given-names></name> <name><surname>Fortunato</surname> <given-names>A. E.</given-names></name> <name><surname>Matthijs</surname> <given-names>M.</given-names></name> <name><surname>Costa</surname> <given-names>B. S.</given-names></name> <name><surname>Vanderhaeghen</surname> <given-names>R.</given-names></name> <name><surname>Van den Daele</surname> <given-names>H.</given-names></name><etal/></person-group> (<year>2013</year>). <article-title>AUREOCHROME1a-mediated induction of the diatom-specific cyclin dsCYC2 controls the onset of cell division in diatoms (<italic>Phaeodactylum tricornutum</italic>).</article-title> <source><italic>Plant Cell</italic></source> <volume>25</volume> <fpage>215</fpage>&#x2013;<lpage>228</lpage>. <pub-id pub-id-type="doi">10.1105/tpc.112.106377</pub-id> <pub-id pub-id-type="pmid">23292736</pub-id></citation></ref>
<ref id="B55"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kanehisa</surname> <given-names>M.</given-names></name></person-group> (<year>2017</year>). <article-title>Enzyme Annotation and Metabolic Reconstruction Using KEGG.</article-title> <source><italic>Methods Mol. Biol.</italic></source> <volume>1611</volume> <fpage>135</fpage>&#x2013;<lpage>145</lpage>. <pub-id pub-id-type="doi">10.1007/978-1-4939-7015-5_11</pub-id></citation></ref>
<ref id="B56"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kanehisa</surname> <given-names>M.</given-names></name> <name><surname>Sato</surname> <given-names>Y.</given-names></name></person-group> (<year>2020</year>). <article-title>KEGG Mapper for inferring cellular functions from protein sequences.</article-title> <source><italic>Protein Sci.</italic></source> <volume>29</volume> <fpage>28</fpage>&#x2013;<lpage>35</lpage>. <pub-id pub-id-type="doi">10.1002/pro.3711</pub-id> <pub-id pub-id-type="pmid">31423653</pub-id></citation></ref>
<ref id="B57"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Katoh</surname> <given-names>K.</given-names></name> <name><surname>Misawa</surname> <given-names>K.</given-names></name> <name><surname>Kuma</surname> <given-names>K.-I.</given-names></name> <name><surname>Miyata</surname> <given-names>T.</given-names></name></person-group> (<year>2002</year>). <article-title>MAFFT: a novel method for rapid multiple sequence alignment based on fast Fourier transform.</article-title> <source><italic>Nucl. Acids Res.</italic></source> <volume>30</volume> <fpage>3059</fpage>&#x2013;<lpage>3066</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkf436</pub-id> <pub-id pub-id-type="pmid">12136088</pub-id></citation></ref>
<ref id="B58"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kazamia</surname> <given-names>E.</given-names></name> <name><surname>Sutak</surname> <given-names>R.</given-names></name> <name><surname>Paz-Yepes</surname> <given-names>J.</given-names></name> <name><surname>Dorrell</surname> <given-names>R. G.</given-names></name> <name><surname>Vieira</surname> <given-names>F. R. J.</given-names></name> <name><surname>Mach</surname> <given-names>J.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>Endocytosis-mediated siderophore uptake as a strategy for Fe acquisition in diatoms.</article-title> <source><italic>Sci. Adv.</italic></source> <volume>16</volume>:<issue>5</issue>. <pub-id pub-id-type="doi">10.1126/sciadv.aar4536</pub-id> <pub-id pub-id-type="pmid">29774236</pub-id></citation></ref>
<ref id="B59"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kearse</surname> <given-names>M.</given-names></name> <name><surname>Moir</surname> <given-names>R.</given-names></name> <name><surname>Wilson</surname> <given-names>A.</given-names></name> <name><surname>Stones-Havas</surname> <given-names>S.</given-names></name> <name><surname>Cheung</surname> <given-names>M.</given-names></name> <name><surname>Sturrock</surname> <given-names>S.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>Geneious Basic: an integrated and extendable desktop software platform for the organization and analysis of sequence data.</article-title> <source><italic>Bioinformatics</italic></source> <volume>28</volume> <fpage>1647</fpage>&#x2013;<lpage>1649</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/bts199</pub-id> <pub-id pub-id-type="pmid">22543367</pub-id></citation></ref>
<ref id="B60"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Keeling</surname> <given-names>P. J.</given-names></name> <name><surname>Burki</surname> <given-names>F.</given-names></name> <name><surname>Wilcox</surname> <given-names>H. M.</given-names></name> <name><surname>Allam</surname> <given-names>B.</given-names></name> <name><surname>Allen</surname> <given-names>E. E.</given-names></name> <name><surname>Amaral-Zettler</surname> <given-names>L. A.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>The marine microbial eukaryote transcriptome sequencing project (MMETSP): illuminating the functional diversity of eukaryotic life in the oceans through transcriptome sequencing.</article-title> <source><italic>PLoS Biol.</italic></source> <volume>10</volume>:<issue>1001889</issue>. <pub-id pub-id-type="doi">10.1073/pnas.1603112113</pub-id> <pub-id pub-id-type="pmid">27531955</pub-id></citation></ref>
<ref id="B61"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kikutani</surname> <given-names>S.</given-names></name> <name><surname>Nakajima</surname> <given-names>K.</given-names></name> <name><surname>Nagasato</surname> <given-names>C.</given-names></name> <name><surname>Tsuji</surname> <given-names>Y.</given-names></name> <name><surname>Miyatake</surname> <given-names>A.</given-names></name> <name><surname>Matsuda</surname> <given-names>Y.</given-names></name></person-group> (<year>2016</year>). <article-title>Thylakoid luminal theta-carbonic anhydrase critical for growth and photosynthesis in the marine diatom <italic>Phaeodactylum tricornutum</italic>.</article-title> <source><italic>Proc. Natl. Acad. Sci. U.S.A.</italic></source> <volume>113</volume> <fpage>9828</fpage>&#x2013;<lpage>9833</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1603112113</pub-id> <pub-id pub-id-type="pmid">27531955</pub-id></citation></ref>
<ref id="B62"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kim</surname> <given-names>E.-D.</given-names></name> <name><surname>Sung</surname> <given-names>S.</given-names></name></person-group> (<year>2012</year>). <article-title>Long noncoding RNA: unveiling hidden layer of gene regulatory networks.</article-title> <source><italic>Trends Plant Sci.</italic></source> <volume>17</volume> <fpage>16</fpage>&#x2013;<lpage>21</lpage>. <pub-id pub-id-type="doi">10.1016/j.tplants.2011.10.008</pub-id> <pub-id pub-id-type="pmid">22104407</pub-id></citation></ref>
<ref id="B63"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kroth</surname> <given-names>P. G.</given-names></name> <name><surname>Chiovitti</surname> <given-names>A.</given-names></name> <name><surname>Gruber</surname> <given-names>A.</given-names></name> <name><surname>Martin-Jezequel</surname> <given-names>V.</given-names></name> <name><surname>Mock</surname> <given-names>T.</given-names></name> <name><surname>Parker</surname> <given-names>M. S.</given-names></name></person-group> (<year>2008</year>). <article-title>A model for carbohydrate metabolism in the diatom <italic>Phaeodactylum tricornutum</italic> deduced from comparative whole genome analysis.</article-title> <source><italic>PLoS One</italic></source> <volume>3</volume>:<issue>e1426</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0001426</pub-id> <pub-id pub-id-type="pmid">18183306</pub-id></citation></ref>
<ref id="B64"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kroth</surname> <given-names>P. G.</given-names></name> <name><surname>Wilhelm</surname> <given-names>C.</given-names></name> <name><surname>Kottke</surname> <given-names>T.</given-names></name></person-group> (<year>2017</year>). <article-title>An update on aureochromes: phylogeny - mechanism - function.</article-title> <source><italic>J. Plant Physiol.</italic></source> <volume>217</volume> <fpage>20</fpage>&#x2013;<lpage>26</lpage>. <pub-id pub-id-type="doi">10.1016/j.jplph.2017.06.010</pub-id> <pub-id pub-id-type="pmid">28797596</pub-id></citation></ref>
<ref id="B65"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Kustka</surname> <given-names>A.</given-names></name> <name><surname>Milligan</surname> <given-names>A. J.</given-names></name> <name><surname>Zheng</surname> <given-names>H.</given-names></name> <name><surname>New</surname> <given-names>A. M.</given-names></name> <name><surname>Gates</surname> <given-names>C.</given-names></name> <name><surname>Bidle</surname> <given-names>K. D.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>Low CO2 results in a rearrangement of carbon metabolism to support C4 photosynthetic carbon assimilation in Thalassiosira pseudonana.</article-title> <source><italic>New Phytol.</italic></source> <volume>204</volume> <fpage>507</fpage>&#x2013;<lpage>520</lpage>. <pub-id pub-id-type="doi">10.1111/nph.12926</pub-id> <pub-id pub-id-type="pmid">25046577</pub-id></citation></ref>
<ref id="B66"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Lampe</surname> <given-names>R. H.</given-names></name> <name><surname>Mann</surname> <given-names>E. L.</given-names></name> <name><surname>Cohen</surname> <given-names>N. R.</given-names></name> <name><surname>Till</surname> <given-names>C. P.</given-names></name> <name><surname>Thamatrakoln</surname> <given-names>K.</given-names></name> <name><surname>Brzezinski</surname> <given-names>M. A.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>Different iron storage strategies among bloom-forming diatoms.</article-title> <source><italic>Proc. Natl. Acad. Sci. U.S.A</italic></source> <volume>115</volume> <fpage>12275</fpage>&#x2013;<lpage>12284</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.1805243115</pub-id> <pub-id pub-id-type="pmid">30538208</pub-id></citation></ref>
<ref id="B67"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Langfelder</surname> <given-names>P.</given-names></name> <name><surname>Horvath</surname> <given-names>S.</given-names></name></person-group> (<year>2008</year>). <article-title>WGCNA: an R package for weighted correlation network analysis.</article-title> <source><italic>BMC Bioinformat.</italic></source> <volume>9</volume>:<issue>559</issue>. <pub-id pub-id-type="doi">10.1186/1471-2105-9-559</pub-id> <pub-id pub-id-type="pmid">19114008</pub-id></citation></ref>
<ref id="B68"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Levering</surname> <given-names>J.</given-names></name> <name><surname>Broddrick</surname> <given-names>J.</given-names></name> <name><surname>Dupont</surname> <given-names>C. L.</given-names></name> <name><surname>Peers</surname> <given-names>G.</given-names></name> <name><surname>Beeri</surname> <given-names>K.</given-names></name> <name><surname>Mayers</surname> <given-names>J.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>Genome-scale model reveals metabolic basis of biomass partitioning in a model diatom.</article-title> <source><italic>PLoS One</italic></source> <volume>11</volume>:<issue>0155038</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0155038</pub-id> <pub-id pub-id-type="pmid">27152931</pub-id></citation></ref>
<ref id="B69"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Li</surname> <given-names>X.</given-names></name> <name><surname>Patena</surname> <given-names>W.</given-names></name> <name><surname>Fauser</surname> <given-names>F.</given-names></name> <name><surname>Jinkerson</surname> <given-names>R. E.</given-names></name> <name><surname>Saroussi</surname> <given-names>S.</given-names></name> <name><surname>Meyer</surname> <given-names>M. T.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>A genome-wide algal mutant library reveals a global view of genes required for eukaryotic photosynthesis</article-title>. <source><italic>Nat. Genet.</italic></source> <volume>1</volume>, <fpage>627</fpage>&#x2013;<lpage>635</lpage>. <pub-id pub-id-type="doi">10.1038/s41588-019-0370-6</pub-id> <pub-id pub-id-type="pmid">30886426</pub-id></citation></ref>
<ref id="B70"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Liao</surname> <given-names>Y.</given-names></name> <name><surname>Smyth</surname> <given-names>G. K.</given-names></name> <name><surname>Shi</surname> <given-names>W.</given-names></name></person-group> (<year>2014</year>). <article-title>featureCounts: an efficient general purpose program for assigning sequence reads to genomic features.</article-title> <source><italic>Bioinformatics</italic></source> <volume>30</volume> <fpage>923</fpage>&#x2013;<lpage>930</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btt656</pub-id> <pub-id pub-id-type="pmid">24227677</pub-id></citation></ref>
<ref id="B71"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Love</surname> <given-names>M. I.</given-names></name> <name><surname>Huber</surname> <given-names>W.</given-names></name> <name><surname>Anders</surname> <given-names>S.</given-names></name></person-group> (<year>2014</year>). <article-title>Moderated estimation of fold change and dispersion for RNA-seq data with DESeq2.</article-title> <source><italic>Genom. Biol.</italic></source> <volume>15</volume>:<issue>550</issue>. <pub-id pub-id-type="doi">10.1186/s13059-014-0550-8</pub-id> <pub-id pub-id-type="pmid">25516281</pub-id></citation></ref>
<ref id="B72"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Maheswari</surname> <given-names>U.</given-names></name> <name><surname>Jabbari</surname> <given-names>K.</given-names></name> <name><surname>Petit</surname> <given-names>J.-L.</given-names></name> <name><surname>Porcel</surname> <given-names>B. M.</given-names></name> <name><surname>Allen</surname> <given-names>A. E.</given-names></name> <name><surname>Cadoret</surname> <given-names>J.-P.</given-names></name><etal/></person-group> (<year>2010</year>). <article-title>Digital expression profiling of novel diatom transcripts provides insight into their biological functions.</article-title> <source><italic>Genom. Biol.</italic></source> <volume>11</volume>:<issue>85</issue>. <pub-id pub-id-type="doi">10.1186/gb-2010-11-8-r85</pub-id> <pub-id pub-id-type="pmid">20738856</pub-id></citation></ref>
<ref id="B73"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mann</surname> <given-names>M.</given-names></name> <name><surname>Serif</surname> <given-names>M.</given-names></name> <name><surname>Jakob</surname> <given-names>T.</given-names></name> <name><surname>Kroth</surname> <given-names>P. G.</given-names></name> <name><surname>Wilhelm</surname> <given-names>C.</given-names></name></person-group> (<year>2017</year>). <article-title>PtAUREO1a and PtAUREO1b knockout mutants of the diatom <italic>Phaeodactylum tricornutum</italic> are blocked in photoacclimation to blue light.</article-title> <source><italic>J. Plant Physiol.</italic></source> <volume>217</volume> <fpage>44</fpage>&#x2013;<lpage>48</lpage>. <pub-id pub-id-type="doi">10.1016/j.jplph.2017.05.020</pub-id> <pub-id pub-id-type="pmid">28610707</pub-id></citation></ref>
<ref id="B74"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Mar&#x00E9;chal</surname> <given-names>E.</given-names></name> <name><surname>Lupette</surname> <given-names>J.</given-names></name></person-group> (<year>2020</year>). <article-title>Relationship between acyl-lipid and sterol metabolisms in diatoms.</article-title> <source><italic>Biochimie</italic></source> <volume>169</volume> <fpage>3</fpage>&#x2013;<lpage>11</lpage>. <pub-id pub-id-type="doi">10.1016/j.biochi.2019.07.005</pub-id> <pub-id pub-id-type="pmid">31291593</pub-id></citation></ref>
<ref id="B75"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Maxwell Burroughs</surname> <given-names>A.</given-names></name> <name><surname>Aravind</surname> <given-names>L.</given-names></name></person-group> (<year>2014</year>). <article-title>A highly conserved family of domains related to the DNA-glycosylase fold helps predict multiple novel pathways for RNA modifications.</article-title> <source><italic>RNA Biol.</italic></source> <volume>11</volume> <fpage>360</fpage>&#x2013;<lpage>372</lpage>. <pub-id pub-id-type="doi">10.4161/rna.28302</pub-id> <pub-id pub-id-type="pmid">24646681</pub-id></citation></ref>
<ref id="B76"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>McCarthy</surname> <given-names>J. K.</given-names></name> <name><surname>Smith</surname> <given-names>S. R.</given-names></name> <name><surname>McCrow</surname> <given-names>J. P.</given-names></name> <name><surname>Tan</surname> <given-names>M.</given-names></name> <name><surname>Zheng</surname> <given-names>H.</given-names></name> <name><surname>Beeri</surname> <given-names>K.</given-names></name><etal/></person-group> (<year>2017</year>). <article-title>Nitrate reductase knockout uncouples nitrate transport from nitrate assimilation and drives repartitioning of carbon flux in a model pennate diatom.</article-title> <source><italic>Plant Cell</italic></source> <volume>29</volume> <fpage>2047</fpage>&#x2013;<lpage>2070</lpage>. <pub-id pub-id-type="doi">10.1105/tpc.16.00910</pub-id> <pub-id pub-id-type="pmid">28765511</pub-id></citation></ref>
<ref id="B77"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Michalak</surname> <given-names>P.</given-names></name></person-group> (<year>2008</year>). <article-title>Coexpression, co-regulation and cofunctionality of neighboring genes in eukaryotic genomes.</article-title> <source><italic>Genomics</italic></source> <volume>91</volume> <fpage>243</fpage>&#x2013;<lpage>248</lpage>. <pub-id pub-id-type="doi">10.1016/j.ygeno.2007.11.002</pub-id> <pub-id pub-id-type="pmid">18082363</pub-id></citation></ref>
<ref id="B78"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Monnier</surname> <given-names>A.</given-names></name> <name><surname>Liverani</surname> <given-names>S.</given-names></name> <name><surname>Bouvet</surname> <given-names>R.</given-names></name> <name><surname>Jesson</surname> <given-names>B.</given-names></name> <name><surname>Smith</surname> <given-names>J. Q.</given-names></name> <name><surname>Mosser</surname> <given-names>J.</given-names></name><etal/></person-group> (<year>2010</year>). <article-title>Orchestrated transcription of biological processes in the marine picoeukaryote Ostreococcus exposed to light/dark cycles.</article-title> <source><italic>BMC Genom</italic></source> <volume>11</volume>:<issue>192</issue>. <pub-id pub-id-type="doi">10.1186/1471-2164-11-192</pub-id> <pub-id pub-id-type="pmid">20307298</pub-id></citation></ref>
<ref id="B79"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Morey</surname> <given-names>M.</given-names></name> <name><surname>Fern&#x00E1;ndez-Marmiesse</surname> <given-names>A.</given-names></name> <name><surname>Casti&#x00F1;eiras</surname> <given-names>D.</given-names></name> <name><surname>Fraga</surname> <given-names>J.</given-names></name> <name><surname>Couce</surname> <given-names>M. L.</given-names></name> <name><surname>Cocho</surname> <given-names>J. A.</given-names></name></person-group> (<year>2013</year>). <article-title>A glimpse into past, present and future DNA sequencing.</article-title> <source><italic>Mol. Genet. Metab.</italic></source> <volume>110</volume> <fpage>3</fpage>&#x2013;<lpage>24</lpage>. <pub-id pub-id-type="doi">10.1016/j.ymgme.2013.04.024</pub-id> <pub-id pub-id-type="pmid">23742747</pub-id></citation></ref>
<ref id="B80"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Moriya</surname> <given-names>Y.</given-names></name> <name><surname>Itoh</surname> <given-names>M.</given-names></name> <name><surname>Okuda</surname> <given-names>S.</given-names></name> <name><surname>Yoshizawa</surname> <given-names>A. C.</given-names></name> <name><surname>Kanehisa</surname> <given-names>M.</given-names></name></person-group> (<year>2007</year>). <article-title>KAAS: an automatic genome annotation and pathway reconstruction server.</article-title> <source><italic>Nucl. Acids Res.</italic></source> <volume>35</volume> <fpage>182</fpage>&#x2013;<lpage>185</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkm321</pub-id> <pub-id pub-id-type="pmid">17526522</pub-id></citation></ref>
<ref id="B81"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Murik</surname> <given-names>O.</given-names></name> <name><surname>Tirichine</surname> <given-names>L.</given-names></name> <name><surname>Prihoda</surname> <given-names>J.</given-names></name> <name><surname>Thomas</surname> <given-names>Y.</given-names></name> <name><surname>Ara&#x00FA;jo</surname> <given-names>W. L.</given-names></name> <name><surname>Allen</surname> <given-names>A. E.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>Downregulation of mitochondrial alternative oxidase affects chloroplast function, redox status and stress response in a marine diatom.</article-title> <source><italic>New Phytol.</italic></source> <volume>221</volume> <fpage>1303</fpage>&#x2013;<lpage>1316</lpage>. <pub-id pub-id-type="doi">10.1111/nph.15479</pub-id> <pub-id pub-id-type="pmid">30216452</pub-id></citation></ref>
<ref id="B82"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nonoyama</surname> <given-names>T.</given-names></name> <name><surname>Kazamia</surname> <given-names>E.</given-names></name> <name><surname>Nawaly</surname> <given-names>H.</given-names></name> <name><surname>Gao</surname> <given-names>X.</given-names></name> <name><surname>Tsuji</surname> <given-names>Y.</given-names></name> <name><surname>Matsuda</surname> <given-names>Y.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>Metabolic innovations underpinning the origin and diversification of the diatom chloroplast.</article-title> <source><italic>Biomolecules</italic></source> <volume>9</volume>:<issue>322</issue>. <pub-id pub-id-type="doi">10.3390/biom9080322</pub-id> <pub-id pub-id-type="pmid">31366180</pub-id></citation></ref>
<ref id="B83"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Noordally</surname> <given-names>Z. B.</given-names></name> <name><surname>Ishii</surname> <given-names>K.</given-names></name> <name><surname>Atkins</surname> <given-names>K. A.</given-names></name> <name><surname>Wetherill</surname> <given-names>S. J.</given-names></name> <name><surname>Kusakina</surname> <given-names>J.</given-names></name> <name><surname>Walton</surname> <given-names>E. J.</given-names></name><etal/></person-group> (<year>2013</year>). <article-title>Circadian control of chloroplast transcription by a nuclear-encoded timing signal.</article-title> <source><italic>Science</italic></source> <volume>339</volume> <fpage>1316</fpage>&#x2013;<lpage>1319</lpage>. <pub-id pub-id-type="doi">10.1126/science.1230397</pub-id> <pub-id pub-id-type="pmid">23493713</pub-id></citation></ref>
<ref id="B84"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Norbury</surname> <given-names>C. J.</given-names></name></person-group> (<year>2010</year>). <article-title>3&#x2019; uridylation and the regulation of RNA function in the cytoplasm.</article-title> <source><italic>Biochem. Soc. Trans.</italic></source> <volume>38</volume> <fpage>1150</fpage>&#x2013;<lpage>1153</lpage>. <pub-id pub-id-type="doi">10.1042/bst0381150</pub-id> <pub-id pub-id-type="pmid">20659020</pub-id></citation></ref>
<ref id="B85"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Nov&#x00E1;k Vanclov&#x00E1;</surname> <given-names>A. M. G.</given-names></name> <name><surname>Zoltner</surname> <given-names>M.</given-names></name> <name><surname>Kelly</surname> <given-names>S.</given-names></name> <name><surname>Soukal</surname> <given-names>P.</given-names></name> <name><surname>Z&#x00E1;honov&#x00E1;</surname> <given-names>K.</given-names></name> <name><surname>F&#x00FC;ssy</surname> <given-names>Z.</given-names></name><etal/></person-group> (<year>2020</year>). <article-title>Metabolic quirks and the colourful history of the Euglena gracilis secondary plastid.</article-title> <source><italic>New Phytol.</italic></source> <volume>225</volume> <fpage>1578</fpage>&#x2013;<lpage>1592</lpage>. <pub-id pub-id-type="doi">10.1111/nph.16237</pub-id> <pub-id pub-id-type="pmid">31580486</pub-id></citation></ref>
<ref id="B86"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Osborn</surname> <given-names>H. L.</given-names></name> <name><surname>Hook</surname> <given-names>S. E.</given-names></name></person-group> (<year>2013</year>). <article-title>Using transcriptomic profiles in the diatom <italic>Phaeodactylum tricornutum</italic> to identify and prioritize stressors.</article-title> <source><italic>Aquat. Toxicol.</italic></source> <volume>13</volume> <fpage>12</fpage>&#x2013;<lpage>25</lpage>. <pub-id pub-id-type="doi">10.1016/j.aquatox.2013.04.002</pub-id> <pub-id pub-id-type="pmid">23680677</pub-id></citation></ref>
<ref id="B87"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Oudot-Le Secq</surname> <given-names>M. P.</given-names></name> <name><surname>Green</surname> <given-names>B. R.</given-names></name></person-group> (<year>2011</year>). <article-title>Complex repeat structures and novel features in the mitochondrial genomes of the diatoms <italic>Phaeodactylum tricornutum</italic> and Thalassiosira pseudonana.</article-title> <source><italic>Gene</italic></source> <volume>476</volume> <fpage>20</fpage>&#x2013;<lpage>26</lpage>. <pub-id pub-id-type="doi">10.1016/j.gene.2011.02.001</pub-id> <pub-id pub-id-type="pmid">21320580</pub-id></citation></ref>
<ref id="B88"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Oudot-Le Secq</surname> <given-names>M. P.</given-names></name> <name><surname>Grimwood</surname> <given-names>J.</given-names></name> <name><surname>Shapiro</surname> <given-names>H.</given-names></name> <name><surname>Armbrust</surname> <given-names>E. V.</given-names></name> <name><surname>Bowler</surname> <given-names>C.</given-names></name> <name><surname>Green</surname> <given-names>B. R.</given-names></name></person-group> (<year>2007</year>). <article-title>Chloroplast genomes of the diatoms <italic>Phaeodactylum tricornutum</italic> and Thalassiosira pseudonana: comparison with other plastid genomes of the red lineage.</article-title> <source><italic>Mol. Genet. Genom.</italic></source> <volume>277</volume> <fpage>427</fpage>&#x2013;<lpage>439</lpage>. <pub-id pub-id-type="doi">10.1007/s00438-006-0199-4</pub-id> <pub-id pub-id-type="pmid">17252281</pub-id></citation></ref>
<ref id="B89"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Park</surname> <given-names>B. H.</given-names></name> <name><surname>Karpinets</surname> <given-names>T. V.</given-names></name> <name><surname>Syed</surname> <given-names>M. H.</given-names></name> <name><surname>Leuze</surname> <given-names>M. R.</given-names></name> <name><surname>Uberbacher</surname> <given-names>E. C.</given-names></name></person-group> (<year>2010</year>). <article-title>CAZymes Analysis Toolkit (CAT): Web service for searching and analyzing carbohydrate-active enzymes in a newly sequenced organism using CAZy database.</article-title> <source><italic>Glycobiology</italic></source> <volume>20</volume> <fpage>1574</fpage>&#x2013;<lpage>1584</lpage>. <pub-id pub-id-type="doi">10.1093/glycob/cwq106</pub-id> <pub-id pub-id-type="pmid">20696711</pub-id></citation></ref>
<ref id="B90"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Parks</surname> <given-names>M. B.</given-names></name> <name><surname>Nakov</surname> <given-names>T.</given-names></name> <name><surname>Ruck</surname> <given-names>E. C.</given-names></name> <name><surname>Wickett</surname> <given-names>N. J.</given-names></name> <name><surname>Alverson</surname> <given-names>A. J.</given-names></name></person-group> (<year>2018</year>). <article-title>Phylogenomics reveals an extensive history of genome duplication in diatoms (Bacillariophyta).</article-title> <source><italic>Am. J. Bot.</italic></source> <volume>105</volume> <fpage>330</fpage>&#x2013;<lpage>347</lpage>. <pub-id pub-id-type="doi">10.1002/ajb2.1056</pub-id> <pub-id pub-id-type="pmid">29665021</pub-id></citation></ref>
<ref id="B91"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Prihoda</surname> <given-names>J.</given-names></name> <name><surname>Tanaka</surname> <given-names>A.</given-names></name> <name><surname>de Paula</surname> <given-names>W. B. M.</given-names></name> <name><surname>Allen</surname> <given-names>J. F.</given-names></name> <name><surname>Tirichine</surname> <given-names>L.</given-names></name> <name><surname>Bowler</surname> <given-names>C.</given-names></name></person-group> (<year>2012</year>). <article-title>Chloroplast-mitochondria cross-talk in diatoms.</article-title> <source><italic>J. Exp. Bot.</italic></source> <volume>63</volume> <fpage>1543</fpage>&#x2013;<lpage>1557</lpage>. <pub-id pub-id-type="doi">10.1093/jxb/err441</pub-id> <pub-id pub-id-type="pmid">22268145</pub-id></citation></ref>
<ref id="B92"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rastogi</surname> <given-names>A.</given-names></name> <name><surname>Maheswari</surname> <given-names>U.</given-names></name> <name><surname>Dorrell</surname> <given-names>R. G.</given-names></name> <name><surname>Vieira</surname> <given-names>F. R. J.</given-names></name> <name><surname>Maumus</surname> <given-names>F.</given-names></name> <name><surname>Kustka</surname> <given-names>A.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>Integrative analysis of large scale transcriptome data draws a comprehensive landscape of <italic>Phaeodactylum tricornutum</italic> genome and evolutionary origin of diatoms.</article-title> <source><italic>Sci. Rep.</italic></source> <volume>8</volume>:<issue>4834</issue>. <pub-id pub-id-type="doi">10.1038/s41598-018-23106-x</pub-id> <pub-id pub-id-type="pmid">29556065</pub-id></citation></ref>
<ref id="B93"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Rayko</surname> <given-names>E.</given-names></name> <name><surname>Maumus</surname> <given-names>F.</given-names></name> <name><surname>Maheswari</surname> <given-names>U.</given-names></name> <name><surname>Jabbari</surname> <given-names>K.</given-names></name> <name><surname>Bowler</surname> <given-names>C.</given-names></name></person-group> (<year>2010</year>). <article-title>Transcription factor families inferred from genome sequences of photosynthetic stramenopiles.</article-title> <source><italic>New Phytol.</italic></source> <volume>188</volume> <fpage>52</fpage>&#x2013;<lpage>66</lpage>. <pub-id pub-id-type="doi">10.1111/j.1469-8137.2010.03371.x</pub-id> <pub-id pub-id-type="pmid">20646219</pub-id></citation></ref>
<ref id="B94"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Reja</surname> <given-names>R.</given-names></name> <name><surname>Vinayachandran</surname> <given-names>V.</given-names></name> <name><surname>Ghosh</surname> <given-names>S.</given-names></name> <name><surname>Pugh</surname> <given-names>B. F.</given-names></name></person-group> (<year>2015</year>). <article-title>Molecular mechanisms of ribosomal protein gene co-regulation.</article-title> <source><italic>Genes Dev.</italic></source> <volume>29</volume> <fpage>1942</fpage>&#x2013;<lpage>1954</lpage>. <pub-id pub-id-type="doi">10.1101/gad.268896.115</pub-id> <pub-id pub-id-type="pmid">26385964</pub-id></citation></ref>
<ref id="B95"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>R&#x00ED;o B&#x00E1;rtulos</surname> <given-names>C.</given-names></name> <name><surname>Rogers</surname> <given-names>M. B.</given-names></name> <name><surname>Williams</surname> <given-names>T. A.</given-names></name> <name><surname>Gentekaki</surname> <given-names>E.</given-names></name> <name><surname>Brinkmann</surname> <given-names>H.</given-names></name> <name><surname>Cerff</surname> <given-names>R.</given-names></name><etal/></person-group> (<year>2018</year>). <article-title>Mitochondrial glycolysis in a major lineage of eukaryotes.</article-title> <source><italic>Genom. Biol. Evol.</italic></source> <volume>10</volume> <fpage>2310</fpage>&#x2013;<lpage>2325</lpage>. <pub-id pub-id-type="doi">10.1093/gbe/evy164</pub-id> <pub-id pub-id-type="pmid">30060189</pub-id></citation></ref>
<ref id="B96"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Roncel</surname> <given-names>M.</given-names></name> <name><surname>Gonzalez-Rodriguez</surname> <given-names>A. A.</given-names></name> <name><surname>Naranjo</surname> <given-names>B.</given-names></name> <name><surname>Bernal-Bayard</surname> <given-names>P.</given-names></name> <name><surname>Lindahl</surname> <given-names>A. M.</given-names></name> <name><surname>Hervas</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>Iron deficiency induces a partial inhibition of the photosynthetic electron transport and a high sensitivity to light in the diatom <italic>P. tricornutum</italic>.</article-title> <source><italic>Front. Plant Sci.</italic></source> <volume>7</volume>:<issue>14</issue>. <pub-id pub-id-type="doi">10.3389/fpls.2016.01050</pub-id> <pub-id pub-id-type="pmid">27536301</pub-id></citation></ref>
<ref id="B97"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Sato</surname> <given-names>S.</given-names></name> <name><surname>Nanjappa</surname> <given-names>D.</given-names></name> <name><surname>Dorrell</surname> <given-names>R. G.</given-names></name> <name><surname>Vieira</surname> <given-names>F. R. J.</given-names></name> <name><surname>Kazamia</surname> <given-names>E.</given-names></name> <name><surname>Tirichine</surname> <given-names>L.</given-names></name><etal/></person-group> (<year>2020</year>). <article-title>Genome-enabled phylogenetic and functional reconstruction of an araphid pennate diatom Plagiostriata sp. <italic>CCMP</italic>470, previously assigned as a radial centric diatom and its bacterial commensal.</article-title> <source><italic>Sci. Rep.</italic></source> <volume>10</volume>:<issue>9449</issue>. <pub-id pub-id-type="doi">10.1038/s41598-020-65941-x</pub-id> <pub-id pub-id-type="pmid">32523048</pub-id></citation></ref>
<ref id="B98"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Schober</surname> <given-names>A.</given-names></name> <name><surname>R&#x00ED;o B&#x00E1;rtulos</surname> <given-names>C.</given-names></name> <name><surname>Bischoff</surname> <given-names>A.</given-names></name> <name><surname>Lepetit</surname> <given-names>B.</given-names></name> <name><surname>Gruber</surname> <given-names>A.</given-names></name> <name><surname>Kroth</surname> <given-names>P. G.</given-names></name></person-group> (<year>2019</year>). <article-title>Organelle studies and proteome analyses of mitochondria and plastids fractions from the diatom Thalassiosira pseudonana.</article-title> <source><italic>Plant Cell Physiol.</italic></source> <volume>60</volume> <fpage>1811</fpage>&#x2013;<lpage>1828</lpage>. <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.1093/pcp/pcz097">https://doi.org/10.1093/pcp/pcz097</ext-link>, <pub-id pub-id-type="doi">10.1093/pcp/pcz097</pub-id> <pub-id pub-id-type="pmid">31179502</pub-id></citation></ref>
<ref id="B99"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shadel</surname> <given-names>G. S.</given-names></name> <name><surname>Clayton</surname> <given-names>D. A.</given-names></name></person-group> (<year>1995</year>). <article-title>A Saccharomyces cerevisiae mitochondrial transcription factor, sc-mtTFB, shares features with sigma factors but is functionally distinct.</article-title> <source><italic>Mol. Cell Biol.</italic></source> <volume>15</volume> <fpage>2101</fpage>&#x2013;<lpage>2108</lpage>. <pub-id pub-id-type="doi">10.1128/mcb.15.4.2101</pub-id> <pub-id pub-id-type="pmid">7891705</pub-id></citation></ref>
<ref id="B100"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shannon</surname> <given-names>P.</given-names></name> <name><surname>Markiel</surname> <given-names>A.</given-names></name> <name><surname>Ozier</surname> <given-names>O.</given-names></name> <name><surname>Baliga</surname> <given-names>N. S.</given-names></name> <name><surname>Wang</surname> <given-names>J. T.</given-names></name> <name><surname>Ramage</surname> <given-names>D.</given-names></name><etal/></person-group> (<year>2003</year>). <article-title>Cytoscape: a software environment for integrated models of biomolecular interaction networks.</article-title> <source><italic>Genom. Res.</italic></source> <volume>13</volume> <fpage>2498</fpage>&#x2013;<lpage>2504</lpage>. <pub-id pub-id-type="doi">10.1101/gr.1239303</pub-id> <pub-id pub-id-type="pmid">14597658</pub-id></citation></ref>
<ref id="B101"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Shimizu</surname> <given-names>M.</given-names></name> <name><surname>Kato</surname> <given-names>H.</given-names></name> <name><surname>Ogawa</surname> <given-names>T.</given-names></name> <name><surname>Kurachi</surname> <given-names>A.</given-names></name> <name><surname>Nakagawa</surname> <given-names>Y.</given-names></name> <name><surname>Kobayashi</surname> <given-names>H.</given-names></name></person-group> (<year>2010</year>). <article-title>Sigma factor phosphorylation in the photosynthetic control of photosystem stoichiometry.</article-title> <source><italic>Proc. Natl. Acad. Sci. U.S.A.</italic></source> <volume>107</volume> <fpage>10760</fpage>&#x2013;<lpage>10764</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.0911692107</pub-id> <pub-id pub-id-type="pmid">20498041</pub-id></citation></ref>
<ref id="B102"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Smith</surname> <given-names>S. R.</given-names></name> <name><surname>Dupont</surname> <given-names>C. L.</given-names></name> <name><surname>McCarthy</surname> <given-names>J. K.</given-names></name> <name><surname>Broddrick</surname> <given-names>J. T.</given-names></name> <name><surname>Oborn&#x00ED;k</surname> <given-names>M.</given-names></name> <name><surname>Hor&#x00E1;k</surname> <given-names>A.</given-names></name><etal/></person-group> (<year>2019</year>). <article-title>Evolution and regulation of nitrogen flux through compartmentalized metabolic networks in a marine diatom.</article-title> <source><italic>Nat. Commun.</italic></source> <volume>10</volume>:<issue>4552</issue>. <pub-id pub-id-type="doi">10.1038/s41467-019-12407-y</pub-id> <pub-id pub-id-type="pmid">31591397</pub-id></citation></ref>
<ref id="B103"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Smith</surname> <given-names>S. R.</given-names></name> <name><surname>Gillard</surname> <given-names>J. T.</given-names></name> <name><surname>Kustka</surname> <given-names>A. B.</given-names></name> <name><surname>McCrow</surname> <given-names>J. B.</given-names></name> <name><surname>Badger</surname> <given-names>J. H.</given-names></name> <name><surname>Zheng</surname> <given-names>H.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>Transcriptional orchestration of the global cellular response of a model pennate diatom to diel light cycling under iron limitation.&#x201D;.</article-title> <source><italic>PLoS Genet</italic></source> <volume>12</volume>:<issue>e1006490</issue>. <pub-id pub-id-type="doi">10.1371/journal.pgen.1006490</pub-id> <pub-id pub-id-type="pmid">27973599</pub-id></citation></ref>
<ref id="B104"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Snel</surname> <given-names>B.</given-names></name> <name><surname>van Noort</surname> <given-names>V.</given-names></name> <name><surname>Huynen</surname> <given-names>M. A.</given-names></name></person-group> (<year>2004</year>). <article-title>Gene co-regulation is highly conserved in the evolution of eukaryotes and prokaryotes.</article-title> <source><italic>Nucl. Acids Res.</italic></source> <volume>32</volume> <fpage>4725</fpage>&#x2013;<lpage>4731</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkh815</pub-id> <pub-id pub-id-type="pmid">15353560</pub-id></citation></ref>
<ref id="B105"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Stamatakis</surname> <given-names>A.</given-names></name></person-group> (<year>2014</year>). <article-title>RAxML version 8: a tool for phylogenetic analysis and post-analysis of large phylogenies.</article-title> <source><italic>Bioinformatics</italic></source> <volume>30</volume> <fpage>1312</fpage>&#x2013;<lpage>1313</lpage>. <pub-id pub-id-type="doi">10.1093/bioinformatics/btu033</pub-id> <pub-id pub-id-type="pmid">24451623</pub-id></citation></ref>
<ref id="B106"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Taddei</surname> <given-names>L.</given-names></name> <name><surname>Stella</surname> <given-names>G. R.</given-names></name> <name><surname>Rogato</surname> <given-names>A.</given-names></name> <name><surname>Bailleul</surname> <given-names>B.</given-names></name> <name><surname>Fortunato</surname> <given-names>A. E.</given-names></name> <name><surname>Annunziata</surname> <given-names>R.</given-names></name><etal/></person-group> (<year>2016</year>). <article-title>Multisignal control of expression of the LHCX protein family in the marine diatom <italic>Phaeodactylum tricornutum</italic>.</article-title> <source><italic>J. Exp. Bot.</italic></source> <volume>67</volume> <fpage>3939</fpage>&#x2013;<lpage>3951</lpage>. <pub-id pub-id-type="doi">10.1093/jxb/erw198</pub-id> <pub-id pub-id-type="pmid">27225826</pub-id></citation></ref>
<ref id="B107"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Takahashi</surname> <given-names>F.</given-names></name> <name><surname>Yamagata</surname> <given-names>D.</given-names></name> <name><surname>Ishikawa</surname> <given-names>M.</given-names></name> <name><surname>Fukamatsu</surname> <given-names>Y.</given-names></name> <name><surname>Ogura</surname> <given-names>Y.</given-names></name> <name><surname>Kasahara</surname> <given-names>M.</given-names></name><etal/></person-group> (<year>2007</year>). <article-title>AUREOCHROME, a photoreceptor required for photomorphogenesis in stramenopiles.</article-title> <source><italic>Proc. Natl. Acad. Sci. U.S.A.</italic></source> <volume>104</volume> <fpage>19625</fpage>&#x2013;<lpage>19630</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.0707692104</pub-id> <pub-id pub-id-type="pmid">18003911</pub-id></citation></ref>
<ref id="B108"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tanaka</surname> <given-names>A.</given-names></name> <name><surname>De Martino</surname> <given-names>A.</given-names></name> <name><surname>Amato</surname> <given-names>A.</given-names></name> <name><surname>Montsant</surname> <given-names>A.</given-names></name> <name><surname>Mathieu</surname> <given-names>B.</given-names></name> <name><surname>Rostaing</surname> <given-names>P.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>Ultrastructure and membrane traffic during cell division in the marine pennate diatom <italic>Phaeodactylum tricornutum</italic>.</article-title> <source><italic>Protist</italic></source> <volume>166</volume> <fpage>506</fpage>&#x2013;<lpage>521</lpage>. <pub-id pub-id-type="doi">10.1016/j.protis.2015.07.005</pub-id> <pub-id pub-id-type="pmid">26386358</pub-id></citation></ref>
<ref id="B109"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Teichmann</surname> <given-names>S. A.</given-names></name> <name><surname>Babu</surname> <given-names>M. M.</given-names></name></person-group> (<year>2002</year>). <article-title>Conservation of gene co-regulation in prokaryotes and eukaryotes.</article-title> <source><italic>Trends Biotechnol.</italic></source> <volume>20</volume> <fpage>407</fpage>&#x2013;<lpage>410</lpage>. <pub-id pub-id-type="doi">10.1016/s0167-7799(02)02032-2</pub-id></citation></ref>
<ref id="B110"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Tsai</surname> <given-names>M.-C.</given-names></name> <name><surname>Manor</surname> <given-names>O.</given-names></name> <name><surname>Wan</surname> <given-names>Y.</given-names></name> <name><surname>Mosammaparast</surname> <given-names>N.</given-names></name> <name><surname>Wang</surname> <given-names>J. K.</given-names></name> <name><surname>Lan</surname> <given-names>F.</given-names></name><etal/></person-group> (<year>2010</year>). <article-title>Long noncoding RNA as modular scaffold of histone modification complexes.</article-title> <source><italic>Science</italic></source> <volume>329</volume> <fpage>689</fpage>&#x2013;<lpage>693</lpage>. <pub-id pub-id-type="doi">10.1126/science.1192002</pub-id> <pub-id pub-id-type="pmid">20616235</pub-id></citation></ref>
<ref id="B111"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Valenzuela</surname> <given-names>J.</given-names></name> <name><surname>Mazurie</surname> <given-names>A.</given-names></name> <name><surname>Carlson</surname> <given-names>R. P.</given-names></name> <name><surname>Gerlach</surname> <given-names>R.</given-names></name> <name><surname>Cooksey</surname> <given-names>K. E.</given-names></name> <name><surname>Peyton</surname> <given-names>B. M.</given-names></name><etal/></person-group> (<year>2012</year>). <article-title>Potential role of multiple carbon fixation pathways during lipid accumulation in <italic>Phaeodactylum tricornutum</italic>.</article-title> <source><italic>Biotechnol. Biofuels</italic></source> <volume>5</volume>:<issue>40</issue>. <pub-id pub-id-type="doi">10.1186/1754-6834-5-40</pub-id> <pub-id pub-id-type="pmid">22672912</pub-id></citation></ref>
<ref id="B112"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Valle</surname> <given-names>K. C.</given-names></name> <name><surname>Nymark</surname> <given-names>M.</given-names></name> <name><surname>Aamot</surname> <given-names>I.</given-names></name> <name><surname>Hancke</surname> <given-names>K.</given-names></name> <name><surname>Winge</surname> <given-names>P.</given-names></name> <name><surname>Andresen</surname> <given-names>K.</given-names></name><etal/></person-group> (<year>2014</year>). <article-title>System responses to equal doses of photosynthetically usable radiation of blue, green and red light in the marine diatom <italic>Phaeodactylum tricornutum</italic>.</article-title> <source><italic>PLoS One</italic></source> <volume>9</volume>:<issue>e114211</issue>. <pub-id pub-id-type="doi">10.1371/journal.pone.0114211</pub-id> <pub-id pub-id-type="pmid">25470731</pub-id></citation></ref>
<ref id="B113"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Veluchamy</surname> <given-names>A.</given-names></name> <name><surname>Lin</surname> <given-names>X.</given-names></name> <name><surname>Maumus</surname> <given-names>F.</given-names></name> <name><surname>Rivarola</surname> <given-names>M.</given-names></name> <name><surname>Bhavsar</surname> <given-names>J.</given-names></name> <name><surname>Creasy</surname> <given-names>T.</given-names></name><etal/></person-group> (<year>2013</year>). <article-title>Insights into the role of DNA methylation in diatoms by genome-wide profiling in <italic>Phaeodactylum tricornutum</italic>.</article-title> <source><italic>Nat. Commun.</italic></source> <volume>4</volume>:<issue>2091</issue>. <pub-id pub-id-type="doi">10.1038/ncomms3091</pub-id> <pub-id pub-id-type="pmid">23820484</pub-id></citation></ref>
<ref id="B114"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Veluchamy</surname> <given-names>A.</given-names></name> <name><surname>Rastogi</surname> <given-names>A.</given-names></name> <name><surname>Lin</surname> <given-names>X.</given-names></name> <name><surname>Lombard</surname> <given-names>B.</given-names></name> <name><surname>Murik</surname> <given-names>O.</given-names></name> <name><surname>Thomas</surname> <given-names>Y.</given-names></name><etal/></person-group> (<year>2015</year>). <article-title>An integrative analysis of post-translational histone modifications in the marine diatom <italic>Phaeodactylum tricornutum</italic>.</article-title> <source><italic>Genom. Biol.</italic></source> <volume>16</volume>:<issue>102</issue>. <pub-id pub-id-type="doi">10.1186/s13059-015-0671-8</pub-id> <pub-id pub-id-type="pmid">25990474</pub-id></citation></ref>
<ref id="B115"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Walker</surname> <given-names>G.</given-names></name> <name><surname>Dorrell</surname> <given-names>R. G.</given-names></name> <name><surname>Schlacht</surname> <given-names>A.</given-names></name> <name><surname>Dacks</surname> <given-names>J. B.</given-names></name></person-group> (<year>2011</year>). <article-title>Eukaryotic systematics: a user&#x2019;s guide for cell biologists and parasitologists.</article-title> <source><italic>Parasitology</italic></source> <volume>138</volume> <fpage>1638</fpage>&#x2013;<lpage>1663</lpage>. <pub-id pub-id-type="doi">10.1017/S0031182010001708</pub-id> <pub-id pub-id-type="pmid">21320384</pub-id></citation></ref>
<ref id="B116"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>P.</given-names></name> <name><surname>Gao</surname> <given-names>J.</given-names></name> <name><surname>Wan</surname> <given-names>C.</given-names></name> <name><surname>Zhang</surname> <given-names>F.</given-names></name> <name><surname>Xu</surname> <given-names>Z.</given-names></name> <name><surname>Huang</surname> <given-names>X.</given-names></name><etal/></person-group> (<year>2010</year>). <article-title>Divinyl chlorophyll(ide) a can be converted to monovinyl chlorophyll(ide) a by a divinyl reductase in rice.</article-title> <source><italic>Plant Physiol.</italic></source> <volume>153</volume> <fpage>994</fpage>&#x2013;<lpage>1003</lpage>. <pub-id pub-id-type="doi">10.1104/pp.110.158477</pub-id> <pub-id pub-id-type="pmid">20484022</pub-id></citation></ref>
<ref id="B117"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wang</surname> <given-names>Y.</given-names></name> <name><surname>Jensen</surname> <given-names>L.</given-names></name> <name><surname>H&#x00F8;jrup</surname> <given-names>P.</given-names></name> <name><surname>Morse</surname> <given-names>D.</given-names></name></person-group> (<year>2005</year>). <article-title>Synthesis and degradation of dinoflagellate plastid-encoded psbA proteins are light-regulated, not circadian-regulated.</article-title> <source><italic>Proc. Natl. Acad. Sci. U.S.A.</italic></source> <volume>102</volume> <fpage>2844</fpage>&#x2013;<lpage>2849</lpage>. <pub-id pub-id-type="doi">10.1073/pnas.0406522102</pub-id> <pub-id pub-id-type="pmid">15703299</pub-id></citation></ref>
<ref id="B118"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Wheeler</surname> <given-names>D. L.</given-names></name> <name><surname>Barrett</surname> <given-names>T.</given-names></name> <name><surname>Benson</surname> <given-names>D. A.</given-names></name> <name><surname>Bryant</surname> <given-names>S. H.</given-names></name> <name><surname>Canese</surname> <given-names>K.</given-names></name> <name><surname>Chetvernin</surname> <given-names>V.</given-names></name><etal/></person-group> (<year>2006</year>). <article-title>Database resources of the National Center for Biotechnology Information.</article-title> <source><italic>Nucl. Acids Res.</italic></source> <volume>34</volume> <fpage>173</fpage>&#x2013;<lpage>180</lpage>. <pub-id pub-id-type="doi">10.1093/nar/gkj158</pub-id> <pub-id pub-id-type="pmid">16381840</pub-id></citation></ref>
<ref id="B119"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Yu</surname> <given-names>M.</given-names></name> <name><surname>Ashworth</surname> <given-names>M. P.</given-names></name> <name><surname>Hajrah</surname> <given-names>N. H.</given-names></name> <name><surname>Khiyami</surname> <given-names>M. A.</given-names></name> <name><surname>Sabir</surname> <given-names>M. J.</given-names></name> <name><surname>Alhebshi</surname> <given-names>A. M.</given-names></name><etal/></person-group> (<year>2018</year>). &#x201C;<article-title>Evolution of the plastid genomes in diatoms</article-title>,&#x201D; in <source><italic>Plastid Genome Evolution</italic></source>, <volume>Vol. 83</volume> <role>eds</role> <person-group person-group-type="editor"><name><surname>Chaw</surname> <given-names>S. M.</given-names></name> <name><surname>Jansen</surname> <given-names>R. K.</given-names></name></person-group> (<publisher-loc>Amsterdam</publisher-loc>: <publisher-name>Elsevier</publisher-name>), <fpage>129</fpage>&#x2013;<lpage>155</lpage>. <pub-id pub-id-type="doi">10.1016/bs.abr.2017.11.009</pub-id></citation></ref>
<ref id="B120"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhao</surname> <given-names>W.</given-names></name> <name><surname>Langfelder</surname> <given-names>P.</given-names></name> <name><surname>Fuller</surname> <given-names>T.</given-names></name> <name><surname>Dong</surname> <given-names>J.</given-names></name> <name><surname>Li</surname> <given-names>A.</given-names></name> <name><surname>Horvath</surname> <given-names>S.</given-names></name></person-group> (<year>2010</year>). <article-title>Weighted gene coexpression network analysis: state of the art.</article-title> <source><italic>J. Biopharm. Stat.</italic></source> <volume>20</volume> <fpage>281</fpage>&#x2013;<lpage>300</lpage>. <pub-id pub-id-type="doi">10.1080/10543400903572753</pub-id> <pub-id pub-id-type="pmid">20309759</pub-id></citation></ref>
<ref id="B121"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zhao</surname> <given-names>X.</given-names></name> <name><surname>Deton Cabanillas</surname> <given-names>A.-F.</given-names></name> <name><surname>Veluchamy</surname> <given-names>A.</given-names></name> <name><surname>Bowler</surname> <given-names>C.</given-names></name> <name><surname>Vieira</surname> <given-names>F. R. J.</given-names></name> <name><surname>Tirichine</surname> <given-names>L.</given-names></name></person-group> (<year>2020</year>). <article-title>Probing the diversity of Polycomb and Trithorax proteins in cultured and environmentally sampled microalgae.</article-title> <source><italic>Front. Mar. Sci.</italic></source> <volume>7</volume>:<issue>3389</issue>. <pub-id pub-id-type="doi">10.3389/fmars.2020.00189</pub-id></citation></ref>
<ref id="B122"><citation citation-type="journal"><person-group person-group-type="author"><name><surname>Zheng</surname> <given-names>Y. T.</given-names></name> <name><surname>Quinn</surname> <given-names>A. H.</given-names></name> <name><surname>Sriram</surname> <given-names>G.</given-names></name></person-group> (<year>2013</year>). <article-title>Experimental evidence and isotopomer analysis of mixotrophic glucose metabolism in the marine diatom <italic>Phaeodactylum tricornutum</italic>.</article-title> <source><italic>Microb. Cell Fact.</italic></source> <volume>12</volume>:<issue>109</issue>. <pub-id pub-id-type="doi">10.1186/1475-2859-12-109</pub-id> <pub-id pub-id-type="pmid">24228629</pub-id></citation></ref>
</ref-list><fn-group>
<fn id="footnote1">
<label>1</label>
<p><ext-link ext-link-type="uri" xlink:href="http://www.ncbi.nlm.nih.gov/Traces/sra/">http://www.ncbi.nlm.nih.gov/Traces/sra/</ext-link></p></fn>
<fn id="footnote2">
<label>2</label>
<p><ext-link ext-link-type="uri" xlink:href="https://www.bioinformatics.babraham.ac.uk/projects/fastqc/">https://www.bioinformatics.babraham.ac.uk/projects/fastqc/</ext-link></p></fn>
<fn id="footnote3">
<label>3</label>
<p><ext-link ext-link-type="uri" xlink:href="http://www.bioinformatics.babraham.ac.uk/projects/trim_galore/">http://www.bioinformatics.babraham.ac.uk/projects/trim_galore/</ext-link></p></fn>
</fn-group>
</back>
</article>